diff --git a/.buildinfo b/.buildinfo index 27a87357..484d9715 100644 --- a/.buildinfo +++ b/.buildinfo @@ -1,4 +1,4 @@ # Sphinx build info version 1 # This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. -config: e76f7632e565cc4f22371a1a0bdd3b1b +config: ceac66979c4f4b0ddfd64e2546c7040b tags: d77d1c0d9ca2f4c8421862c7c5a0d620 diff --git a/_downloads/315c4c52fb68082a731b192d944e2ede/tutorials_python.zip b/_downloads/315c4c52fb68082a731b192d944e2ede/tutorials_python.zip index 4cd5ca50..dfcb475b 100644 Binary files a/_downloads/315c4c52fb68082a731b192d944e2ede/tutorials_python.zip and b/_downloads/315c4c52fb68082a731b192d944e2ede/tutorials_python.zip differ diff --git a/_downloads/a5659940aa3f8f568547d47752a43172/tutorials_jupyter.zip b/_downloads/a5659940aa3f8f568547d47752a43172/tutorials_jupyter.zip index eb9c549d..f5d4fe8f 100644 Binary files a/_downloads/a5659940aa3f8f568547d47752a43172/tutorials_jupyter.zip and b/_downloads/a5659940aa3f8f568547d47752a43172/tutorials_jupyter.zip differ diff --git a/datasets/D4RL/minigrid/fourrooms-random-v0/index.html b/datasets/D4RL/minigrid/fourrooms-random-v0/index.html index 48c895fc..df3724e6 100644 --- a/datasets/D4RL/minigrid/fourrooms-random-v0/index.html +++ b/datasets/D4RL/minigrid/fourrooms-random-v0/index.html @@ -441,7 +441,7 @@

Environment Specs

Observation Space

-

Dict('direction': Discrete(4), 'image': Box(0, 255, (7, 7, 3), uint8), 'mission': MissionSpace(<function FourRoomsEnv._gen_mission at 0x7f91331ee3a0>, None))

+

Dict('direction': Discrete(4), 'image': Box(0, 255, (7, 7, 3), uint8), 'mission': MissionSpace(<function FourRoomsEnv._gen_mission at 0x7f81d3e221f0>, None))

Action Space

Discrete(7)

diff --git a/datasets/D4RL/minigrid/fourrooms-v0/index.html b/datasets/D4RL/minigrid/fourrooms-v0/index.html index 703a2bf1..524344c1 100644 --- a/datasets/D4RL/minigrid/fourrooms-v0/index.html +++ b/datasets/D4RL/minigrid/fourrooms-v0/index.html @@ -441,7 +441,7 @@

Environment Specs

Observation Space

-

Dict('direction': Discrete(4), 'image': Box(0, 255, (7, 7, 3), uint8), 'mission': MissionSpace(<function FourRoomsEnv._gen_mission at 0x7f91331ee3a0>, None))

+

Dict('direction': Discrete(4), 'image': Box(0, 255, (7, 7, 3), uint8), 'mission': MissionSpace(<function FourRoomsEnv._gen_mission at 0x7f81d3e221f0>, None))

Action Space

Discrete(7)

diff --git a/release_notes/index.html b/release_notes/index.html index 38db2b44..3bdc0bbe 100644 --- a/release_notes/index.html +++ b/release_notes/index.html @@ -380,7 +380,7 @@

Release Notes

v0.5.1

-

Released on 2024-10-08 - GitHub - PyPI

+

Released on 2024-10-09 - GitHub - PyPI

Small bug fixes & Python 3.12 support.

What's Changed

    diff --git a/searchindex.js b/searchindex.js index 38ed3dc9..169c044a 100644 --- a/searchindex.js +++ b/searchindex.js @@ -1 +1 @@ -Search.setIndex({"alltitles": {"0.1.0": [[56, "release-0-1-0"]], "0.2.2": [[56, "release-0-2-2"]], "1. Proportional Term (P)": [[61, "proportional-term-p"]], "2. Derivative Term (D)": [[61, "derivative-term-d"]], "3. Integral Term (I)": [[61, "integral-term-i"]], "404 - Page Not Found": [[0, null]], "Ant Maze": [[15, null]], "Attributes": [[3, "attributes"], [6, "attributes"], [7, "attributes"], [8, "attributes"], [9, "attributes"]], "Basic Usage": [[12, null]], "Behavioral cloning with PyTorch": [[65, null], [65, "id1"]], "Build the Documentation": [[1, "build-the-documentation"]], "Building a replay buffer": [[63, "building-a-replay-buffer"]], "Checkpoint Minari Dataset": [[12, "checkpoint-minari-dataset"]], "Cloned": [[22, null], [26, null], [38, null], [51, null]], "Collect Data and Create Minari Dataset": [[61, "collect-data-and-create-minari-dataset"]], "Collecting Data": [[12, "collecting-data"]], "Collecting a subset of a dictionary space with StepDataCallback": [[60, null]], "Combine Minari Datasets": [[10, "combine-minari-datasets"], [12, "combine-minari-datasets"]], "Combine datasets": [[14, "combine-datasets"]], "Complete": [[31, null]], "Content": [[15, "content"], [25, "content"], [29, "content"], [30, "content"], [32, "content"], [37, "content"], [41, "content"], [42, "content"], [54, "content"]], "Create Minari Dataset": [[10, "create-minari-dataset"], [12, "create-minari-dataset"]], "Create Namespace": [[11, "create-namespace"]], "D4RL": [[30, null]], "DataCollector": [[2, null]], "Dataset Creation": [[57, null], [59, null], [62, "dataset-creation"]], "Dataset Metadata": [[13, "dataset-metadata"]], "Dataset Specs": [[16, "dataset-specs"], [17, "dataset-specs"], [18, "dataset-specs"], [19, "dataset-specs"], [20, "dataset-specs"], [21, "dataset-specs"], [22, "dataset-specs"], [23, "dataset-specs"], [24, "dataset-specs"], [26, "dataset-specs"], [27, "dataset-specs"], [28, "dataset-specs"], [31, "dataset-specs"], [33, "dataset-specs"], [34, "dataset-specs"], [35, "dataset-specs"], [36, "dataset-specs"], [38, "dataset-specs"], [39, "dataset-specs"], [40, "dataset-specs"], [43, "dataset-specs"], [44, "dataset-specs"], [45, "dataset-specs"], [46, "dataset-specs"], [47, "dataset-specs"], [48, "dataset-specs"], [49, "dataset-specs"], [50, "dataset-specs"], [51, "dataset-specs"], [52, "dataset-specs"], [53, "dataset-specs"]], "Dataset Standards": [[13, null]], "Dataset generation": [[65, "dataset-generation"]], "Defining the model": [[63, "defining-the-model"]], "Delete Minari Datasets": [[10, "delete-minari-datasets"]], "Delete Namespace": [[11, "delete-namespace"]], "Delete local datasets": [[14, "delete-local-datasets"]], "Description": [[16, "description"], [17, "description"], [18, "description"], [19, "description"], [20, "description"], [21, "description"], [22, "description"], [23, "description"], [24, "description"], [26, "description"], [27, "description"], [28, "description"], [31, "description"], [33, "description"], [34, "description"], [35, "description"], [36, "description"], [38, "description"], [39, "description"], [40, "description"], [43, "description"], [44, "description"], [45, "description"], [46, "description"], [47, "description"], [48, "description"], [49, "description"], [50, "description"], [51, "description"], [52, "description"], [53, "description"]], "Door": [[25, null]], "Download Datasets": [[12, "download-datasets"]], "Download Minari Dataset": [[10, "download-minari-dataset"]], "Download Namespace Metadata": [[11, "download-namespace-metadata"]], "Download datasets": [[14, "download-datasets"]], "Environment Specs": [[16, "environment-specs"], [17, "environment-specs"], [18, "environment-specs"], [19, "environment-specs"], [20, "environment-specs"], [21, "environment-specs"], [22, "environment-specs"], [23, "environment-specs"], [24, "environment-specs"], [26, "environment-specs"], [27, "environment-specs"], [28, "environment-specs"], [31, "environment-specs"], [33, "environment-specs"], [34, "environment-specs"], [35, "environment-specs"], [36, "environment-specs"], [38, "environment-specs"], [39, "environment-specs"], [40, "environment-specs"], [43, "environment-specs"], [44, "environment-specs"], [45, "environment-specs"], [46, "environment-specs"], [47, "environment-specs"], [48, "environment-specs"], [49, "environment-specs"], [50, "environment-specs"], [51, "environment-specs"], [52, "environment-specs"], [53, "environment-specs"]], "EpisodeBuffer": [[3, null]], "EpisodeData": [[6, null]], "EpisodeData Structure": [[13, "episodedata-structure"]], "EpisodeMetadataCallback": [[4, null]], "Evaluation Environment Specs": [[16, "evaluation-environment-specs"], [17, "evaluation-environment-specs"], [18, "evaluation-environment-specs"], [19, "evaluation-environment-specs"], [20, "evaluation-environment-specs"], [21, "evaluation-environment-specs"], [22, "evaluation-environment-specs"], [23, "evaluation-environment-specs"], [24, "evaluation-environment-specs"], [26, "evaluation-environment-specs"], [27, "evaluation-environment-specs"], [28, "evaluation-environment-specs"], [31, "evaluation-environment-specs"], [33, "evaluation-environment-specs"], [34, "evaluation-environment-specs"], [35, "evaluation-environment-specs"], [36, "evaluation-environment-specs"], [38, "evaluation-environment-specs"], [39, "evaluation-environment-specs"], [40, "evaluation-environment-specs"], [43, "evaluation-environment-specs"], [44, "evaluation-environment-specs"], [45, "evaluation-environment-specs"], [46, "evaluation-environment-specs"], [47, "evaluation-environment-specs"], [48, "evaluation-environment-specs"], [49, "evaluation-environment-specs"], [50, "evaluation-environment-specs"], [51, "evaluation-environment-specs"], [52, "evaluation-environment-specs"], [53, "evaluation-environment-specs"]], "Expert": [[23, null], [27, null], [39, null], [52, null]], "Filter Episodes": [[12, "filter-episodes"]], "For headless environments": [[63, "for-headless-environments"]], "Fourrooms": [[36, null]], "Fourrooms-Random": [[35, null]], "Get Local Namespace Metadata": [[11, "get-local-namespace-metadata"]], "Hammer": [[29, null]], "Human": [[24, null], [28, null], [40, null], [53, null]], "Implicit Q-Learning": [[63, "implicit-q-learning"]], "Implicit Q-Learning with TorchRL": [[63, null]], "Imports": [[65, "imports"]], "Installation": [[12, "installation"]], "Kitchen": [[32, null]], "Large": [[44, null]], "Large-Dense": [[43, null]], "Large-Diverse": [[16, null]], "Large-Play": [[17, null]], "List Minari Datasets": [[10, "list-minari-datasets"]], "List Namespaces": [[11, "list-namespaces"]], "List datasets": [[14, "list-datasets"]], "Load Local Datasets": [[12, "load-local-datasets"]], "Load Minari Dataset": [[10, "load-minari-dataset"]], "Loss and optimizer": [[63, "loss-and-optimizer"]], "Medium": [[46, null]], "Medium-Dense": [[45, null]], "Medium-Diverse": [[18, null]], "Medium-Play": [[19, null]], "Methods": [[2, "methods"], [3, "methods"], [4, "methods"], [5, "methods"], [7, "methods"], [8, "methods"]], "Minari": [[10, null]], "Minari CLI": [[14, null]], "Minari Dataset Directory": [[13, "minari-dataset-directory"]], "Minari documentation": [[1, null]], "MinariDataset": [[7, null]], "MinariStorage": [[8, null]], "MiniGrid": [[37, null]], "Mixed": [[33, null]], "Modified StepDataCallback": [[61, "modified-stepdatacallback"]], "Namespace": [[11, null]], "Namespace metadata": [[13, "namespace-metadata"]], "Normalize Score": [[10, "normalize-score"]], "Observation and Action Spaces": [[13, "observation-and-action-spaces"]], "Open": [[48, null]], "Open-Dense": [[47, null]], "Partial": [[34, null]], "Pen": [[41, null]], "Point Maze": [[42, null]], "PointMaze D4RL dataset": [[61, null]], "Policy training": [[65, "policy-training"]], "Pre-requisites": [[63, "pre-requisites"]], "Recover Environment": [[12, "recover-environment"]], "References": [[15, "references"], [25, "references"], [29, "references"], [32, "references"], [37, "references"], [41, "references"], [42, "references"], [54, "references"], [61, "references"]], "Release Notes": [[56, null]], "Relocate": [[54, null]], "Results": [[63, "results"]], "Sampling Episodes": [[12, "sampling-episodes"]], "Save Dataset": [[12, "save-dataset"]], "Serializing a custom space": [[58, null]], "Show datasets details": [[14, "show-datasets-details"]], "Split Dataset": [[12, "split-dataset"]], "Split Minari Dataset": [[10, "split-minari-dataset"]], "StepData": [[9, null]], "StepDataCallback": [[5, null]], "Supported Spaces": [[13, "supported-spaces"]], "The Adroit Pen environment": [[63, "the-adroit-pen-environment"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Training": [[63, "training"]], "Tutorials": [[62, null]], "Umaze": [[21, null], [50, null]], "Umaze-Dense": [[49, null]], "Umaze-Diverse": [[20, null]], "Update Namespace": [[11, "update-namespace"]], "Upload Namespace": [[11, "upload-namespace"]], "Upload datasets": [[14, "upload-datasets"]], "Using Datasets": [[62, "using-datasets"], [64, null], [66, null]], "Using Minari Datasets": [[12, "using-minari-datasets"]], "Using Namespaces": [[12, "using-namespaces"]], "WayPoint Planner": [[61, "waypoint-planner"]], "Waypoint Controller": [[61, "waypoint-controller"]], "minari.DataCollector": [[2, "minari-datacollector"]], "minari.EpisodeData": [[6, "minari-episodedata"]], "minari.EpisodeMetadataCallback": [[4, "minari-episodemetadatacallback"]], "minari.MinariDataset": [[7, "minari-minaridataset"]], "minari.StepData": [[9, "minari-stepdata"]], "minari.StepDataCallback": [[5, "minari-stepdatacallback"]], "minari.data_collector.EpisodeBuffer": [[3, "minari-data-collector-episodebuffer"]], "minari.dataset.minari_storage.MinariStorage": [[8, "minari-dataset-minari-storage-minaristorage"]], "v0.3.0": [[56, "release-v0-3-0"]], "v0.3.1": [[56, "release-v0-3-1"]], "v0.4.0": [[56, "release-v0-4-0"]], "v0.4.1": [[56, "release-v0-4-1"]], "v0.4.2": [[56, "release-v0-4-2"]], "v0.4.3": [[56, "release-v0-4-3"]], "v0.5.0": [[56, "release-v0-5-0"]], "v0.5.1": [[56, "release-v0-5-1"]]}, "docnames": ["404", "README", "api/data_collector", "api/data_collector/episode_buffer", "api/data_collector/episode_metadata_callback", "api/data_collector/step_data_callback", "api/minari_dataset/episode_data", "api/minari_dataset/minari_dataset", "api/minari_dataset/minari_storage", "api/minari_dataset/step_data", "api/minari_functions", "api/namespace/namespace", "content/basic_usage", "content/dataset_standards", "content/minari_cli", "datasets/D4RL/antmaze/index", "datasets/D4RL/antmaze/large-diverse-v1", "datasets/D4RL/antmaze/large-play-v1", "datasets/D4RL/antmaze/medium-diverse-v1", "datasets/D4RL/antmaze/medium-play-v1", "datasets/D4RL/antmaze/umaze-diverse-v1", "datasets/D4RL/antmaze/umaze-v1", "datasets/D4RL/door/cloned-v2", "datasets/D4RL/door/expert-v2", "datasets/D4RL/door/human-v2", "datasets/D4RL/door/index", "datasets/D4RL/hammer/cloned-v2", "datasets/D4RL/hammer/expert-v2", "datasets/D4RL/hammer/human-v2", "datasets/D4RL/hammer/index", "datasets/D4RL/index", "datasets/D4RL/kitchen/complete-v2", "datasets/D4RL/kitchen/index", "datasets/D4RL/kitchen/mixed-v2", "datasets/D4RL/kitchen/partial-v2", "datasets/D4RL/minigrid/fourrooms-random-v0", "datasets/D4RL/minigrid/fourrooms-v0", "datasets/D4RL/minigrid/index", "datasets/D4RL/pen/cloned-v2", "datasets/D4RL/pen/expert-v2", "datasets/D4RL/pen/human-v2", "datasets/D4RL/pen/index", "datasets/D4RL/pointmaze/index", "datasets/D4RL/pointmaze/large-dense-v2", "datasets/D4RL/pointmaze/large-v2", "datasets/D4RL/pointmaze/medium-dense-v2", "datasets/D4RL/pointmaze/medium-v2", "datasets/D4RL/pointmaze/open-dense-v2", "datasets/D4RL/pointmaze/open-v2", "datasets/D4RL/pointmaze/umaze-dense-v2", "datasets/D4RL/pointmaze/umaze-v2", "datasets/D4RL/relocate/cloned-v2", "datasets/D4RL/relocate/expert-v2", "datasets/D4RL/relocate/human-v2", "datasets/D4RL/relocate/index", "index", "release_notes/index", "tutorials/dataset_creation/README", "tutorials/dataset_creation/custom_space_serialization", "tutorials/dataset_creation/index", "tutorials/dataset_creation/observation_space_subseting", "tutorials/dataset_creation/point_maze_dataset", "tutorials/index", "tutorials/using_datasets/IQL_torchrl", "tutorials/using_datasets/README", "tutorials/using_datasets/behavioral_cloning", "tutorials/using_datasets/index"], "envversion": {"sphinx": 62, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1}, "filenames": ["404.md", "README.md", "api/data_collector.md", "api/data_collector/episode_buffer.md", "api/data_collector/episode_metadata_callback.md", "api/data_collector/step_data_callback.md", "api/minari_dataset/episode_data.md", "api/minari_dataset/minari_dataset.md", "api/minari_dataset/minari_storage.md", "api/minari_dataset/step_data.md", "api/minari_functions.md", "api/namespace/namespace.md", "content/basic_usage.md", "content/dataset_standards.md", "content/minari_cli.md", "datasets/D4RL/antmaze/index.md", "datasets/D4RL/antmaze/large-diverse-v1.md", "datasets/D4RL/antmaze/large-play-v1.md", "datasets/D4RL/antmaze/medium-diverse-v1.md", "datasets/D4RL/antmaze/medium-play-v1.md", "datasets/D4RL/antmaze/umaze-diverse-v1.md", "datasets/D4RL/antmaze/umaze-v1.md", "datasets/D4RL/door/cloned-v2.md", "datasets/D4RL/door/expert-v2.md", "datasets/D4RL/door/human-v2.md", "datasets/D4RL/door/index.md", "datasets/D4RL/hammer/cloned-v2.md", "datasets/D4RL/hammer/expert-v2.md", "datasets/D4RL/hammer/human-v2.md", "datasets/D4RL/hammer/index.md", "datasets/D4RL/index.md", "datasets/D4RL/kitchen/complete-v2.md", "datasets/D4RL/kitchen/index.md", "datasets/D4RL/kitchen/mixed-v2.md", "datasets/D4RL/kitchen/partial-v2.md", "datasets/D4RL/minigrid/fourrooms-random-v0.md", "datasets/D4RL/minigrid/fourrooms-v0.md", "datasets/D4RL/minigrid/index.md", "datasets/D4RL/pen/cloned-v2.md", "datasets/D4RL/pen/expert-v2.md", "datasets/D4RL/pen/human-v2.md", "datasets/D4RL/pen/index.md", "datasets/D4RL/pointmaze/index.md", "datasets/D4RL/pointmaze/large-dense-v2.md", "datasets/D4RL/pointmaze/large-v2.md", "datasets/D4RL/pointmaze/medium-dense-v2.md", "datasets/D4RL/pointmaze/medium-v2.md", "datasets/D4RL/pointmaze/open-dense-v2.md", "datasets/D4RL/pointmaze/open-v2.md", "datasets/D4RL/pointmaze/umaze-dense-v2.md", "datasets/D4RL/pointmaze/umaze-v2.md", "datasets/D4RL/relocate/cloned-v2.md", "datasets/D4RL/relocate/expert-v2.md", "datasets/D4RL/relocate/human-v2.md", "datasets/D4RL/relocate/index.md", "index.md", "release_notes/index.md", "tutorials/dataset_creation/README.rst", "tutorials/dataset_creation/custom_space_serialization.rst", "tutorials/dataset_creation/index.rst", "tutorials/dataset_creation/observation_space_subseting.rst", "tutorials/dataset_creation/point_maze_dataset.rst", "tutorials/index.rst", "tutorials/using_datasets/IQL_torchrl.rst", "tutorials/using_datasets/README.rst", "tutorials/using_datasets/behavioral_cloning.rst", "tutorials/using_datasets/index.rst"], "indexentries": {"__call__() (in module minari.episodemetadatacallback)": [[4, "minari.EpisodeMetadataCallback.__call__", false]], "__call__() (in module minari.stepdatacallback)": [[5, "minari.StepDataCallback.__call__", false]], "__len__() (in module minari.data_collector.episodebuffer)": [[3, "minari.data_collector.EpisodeBuffer.__len__", false]], "action (minari.stepdata attribute)": [[9, "minari.StepData.action", false]], "action_space (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.action_space", false]], "actions (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.actions", false]], "actions (minari.episodedata attribute)": [[6, "minari.EpisodeData.actions", false]], "add_step_data() (in module minari.data_collector.episodebuffer)": [[3, "minari.data_collector.EpisodeBuffer.add_step_data", false]], "add_to_dataset() (in module minari.datacollector)": [[2, "minari.DataCollector.add_to_dataset", false]], "apply() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.apply", false]], "close() (in module minari.datacollector)": [[2, "minari.DataCollector.close", false]], "combine_datasets() (in module minari)": [[10, "minari.combine_datasets", false]], "create_dataset() (in module minari.datacollector)": [[2, "minari.DataCollector.create_dataset", false]], "create_dataset_from_buffers() (in module minari)": [[10, "minari.create_dataset_from_buffers", false]], "create_namespace() (in module minari.namespace)": [[11, "minari.namespace.create_namespace", false]], "data_path (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.data_path", false]], "datacollector (class in minari)": [[2, "minari.DataCollector", false]], "delete_dataset() (in module minari)": [[10, "minari.delete_dataset", false]], "delete_namespace() (in module minari.namespace)": [[11, "minari.namespace.delete_namespace", false]], "download_dataset() (in module minari)": [[10, "minari.download_dataset", false]], "download_namespace_metadata() (in module minari.namespace)": [[11, "minari.namespace.download_namespace_metadata", false]], "episode_indices (minari.minaridataset attribute)": [[7, "minari.MinariDataset.episode_indices", false]], "episodebuffer (class in minari.data_collector)": [[3, "minari.data_collector.EpisodeBuffer", false]], "episodedata (class in minari)": [[6, "minari.EpisodeData", false]], "episodemetadatacallback (class in minari)": [[4, "minari.EpisodeMetadataCallback", false]], "filter_episodes() (in module minari.minaridataset)": [[7, "minari.MinariDataset.filter_episodes", false]], "get_episode_metadata() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.get_episode_metadata", false]], "get_episodes() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.get_episodes", false]], "get_namespace_metadata() (in module minari.namespace)": [[11, "minari.namespace.get_namespace_metadata", false]], "get_normalized_score() (in module minari)": [[10, "minari.get_normalized_score", false]], "get_size() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.get_size", false]], "id (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.id", false]], "id (minari.episodedata attribute)": [[6, "minari.EpisodeData.id", false]], "info (minari.stepdata attribute)": [[9, "minari.StepData.info", false]], "infos (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.infos", false]], "infos (minari.episodedata attribute)": [[6, "minari.EpisodeData.infos", false]], "iterate_episodes() (in module minari.minaridataset)": [[7, "minari.MinariDataset.iterate_episodes", false]], "list_local_datasets() (in module minari)": [[10, "minari.list_local_datasets", false]], "list_local_namespaces() (in module minari.namespace)": [[11, "minari.namespace.list_local_namespaces", false]], "list_remote_datasets() (in module minari)": [[10, "minari.list_remote_datasets", false]], "list_remote_namespaces() (in module minari.namespace)": [[11, "minari.namespace.list_remote_namespaces", false]], "load_dataset() (in module minari)": [[10, "minari.load_dataset", false]], "metadata (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.metadata", false]], "minaridataset (class in minari)": [[7, "minari.MinariDataset", false]], "minaristorage (class in minari.dataset.minari_storage)": [[8, "minari.dataset.minari_storage.MinariStorage", false]], "new() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.new", false]], "observation (minari.stepdata attribute)": [[9, "minari.StepData.observation", false]], "observation_space (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.observation_space", false]], "observations (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.observations", false]], "observations (minari.episodedata attribute)": [[6, "minari.EpisodeData.observations", false]], "read() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.read", false]], "recover_environment() (in module minari.minaridataset)": [[7, "minari.MinariDataset.recover_environment", false]], "reset() (in module minari.datacollector)": [[2, "minari.DataCollector.reset", false]], "rewards (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.rewards", false]], "sample_episodes() (in module minari.minaridataset)": [[7, "minari.MinariDataset.sample_episodes", false]], "seed (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.seed", false]], "set_seed() (in module minari.minaridataset)": [[7, "minari.MinariDataset.set_seed", false]], "spec (minari.minaridataset attribute)": [[7, "minari.MinariDataset.spec", false]], "split_dataset() (in module minari)": [[10, "minari.split_dataset", false]], "step() (in module minari.datacollector)": [[2, "minari.DataCollector.step", false]], "stepdata (class in minari)": [[9, "minari.StepData", false]], "stepdatacallback (class in minari)": [[5, "minari.StepDataCallback", false]], "termination (minari.stepdata attribute)": [[9, "minari.StepData.termination", false]], "terminations (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.terminations", false]], "terminations (minari.episodedata attribute)": [[6, "minari.EpisodeData.terminations", false]], "total_episodes (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.total_episodes", false]], "total_episodes (minari.minaridataset attribute)": [[7, "minari.MinariDataset.total_episodes", false]], "total_steps (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.total_steps", false]], "total_steps (minari.minaridataset attribute)": [[7, "minari.MinariDataset.total_steps", false]], "truncation (minari.stepdata attribute)": [[9, "minari.StepData.truncation", false]], "truncations (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.truncations", false]], "truncations (minari.episodedata attribute)": [[6, "minari.EpisodeData.truncations", false]], "update_dataset_from_buffer() (in module minari.minaridataset)": [[7, "minari.MinariDataset.update_dataset_from_buffer", false]], "update_episode_metadata() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_episode_metadata", false]], "update_episodes() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_episodes", false]], "update_from_storage() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_from_storage", false]], "update_metadata() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_metadata", false]], "upload_namespace() (in module minari.namespace)": [[11, "minari.namespace.upload_namespace", false]]}, "objects": {"minari": [[2, 0, 1, "", "DataCollector"], [6, 0, 1, "", "EpisodeData"], [4, 0, 1, "", "EpisodeMetadataCallback"], [7, 0, 1, "", "MinariDataset"], [9, 0, 1, "", "StepData"], [5, 0, 1, "", "StepDataCallback"], [10, 1, 1, "", "combine_datasets"], [10, 1, 1, "", "create_dataset_from_buffers"], [10, 1, 1, "", "delete_dataset"], [10, 1, 1, "", "download_dataset"], [10, 1, 1, "", "get_normalized_score"], [10, 1, 1, "", "list_local_datasets"], [10, 1, 1, "", "list_remote_datasets"], [10, 1, 1, "", "load_dataset"], [10, 1, 1, "", "split_dataset"]], "minari.DataCollector": [[2, 1, 1, "", "add_to_dataset"], [2, 1, 1, "", "close"], [2, 1, 1, "", "create_dataset"], [2, 1, 1, "", "reset"], [2, 1, 1, "", "step"]], "minari.EpisodeData": [[6, 2, 1, "", "actions"], [6, 2, 1, "", "id"], [6, 2, 1, "", "infos"], [6, 2, 1, "", "observations"], [6, 2, 1, "", "terminations"], [6, 2, 1, "", "truncations"]], "minari.EpisodeMetadataCallback": [[4, 1, 1, "", "__call__"]], "minari.MinariDataset": [[7, 2, 1, "", "episode_indices"], [7, 1, 1, "", "filter_episodes"], [7, 1, 1, "", "iterate_episodes"], [7, 1, 1, "", "recover_environment"], [7, 1, 1, "", "sample_episodes"], [7, 1, 1, "", "set_seed"], [7, 2, 1, "", "spec"], [7, 2, 1, "", "total_episodes"], [7, 2, 1, "", "total_steps"], [7, 1, 1, "", "update_dataset_from_buffer"]], "minari.StepData": [[9, 2, 1, "", "action"], [9, 2, 1, "", "info"], [9, 2, 1, "", "observation"], [9, 2, 1, "", "termination"], [9, 2, 1, "", "truncation"]], "minari.StepDataCallback": [[5, 1, 1, "", "__call__"]], "minari.data_collector": [[3, 0, 1, "", "EpisodeBuffer"]], "minari.data_collector.EpisodeBuffer": [[3, 1, 1, "", "__len__"], [3, 2, 1, "", "actions"], [3, 1, 1, "", "add_step_data"], [3, 2, 1, "", "id"], [3, 2, 1, "", "infos"], [3, 2, 1, "", "observations"], [3, 2, 1, "", "rewards"], [3, 2, 1, "", "seed"], [3, 2, 1, "", "terminations"], [3, 2, 1, "", "truncations"]], "minari.dataset.minari_storage": [[8, 0, 1, "", "MinariStorage"]], "minari.dataset.minari_storage.MinariStorage": [[8, 2, 1, "", "action_space"], [8, 1, 1, "", "apply"], [8, 2, 1, "", "data_path"], [8, 1, 1, "", "get_episode_metadata"], [8, 1, 1, "", "get_episodes"], [8, 1, 1, "", "get_size"], [8, 2, 1, "", "metadata"], [8, 1, 1, "", "new"], [8, 2, 1, "", "observation_space"], [8, 1, 1, "", "read"], [8, 2, 1, "", "total_episodes"], [8, 2, 1, "", "total_steps"], [8, 1, 1, "", "update_episode_metadata"], [8, 1, 1, "", "update_episodes"], [8, 1, 1, "", "update_from_storage"], [8, 1, 1, "", "update_metadata"]], "minari.namespace": [[11, 1, 1, "", "create_namespace"], [11, 1, 1, "", "delete_namespace"], [11, 1, 1, "", "download_namespace_metadata"], [11, 1, 1, "", "get_namespace_metadata"], [11, 1, 1, "", "list_local_namespaces"], [11, 1, 1, "", "list_remote_namespaces"], [11, 1, 1, "", "upload_namespace"]]}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "function", "Python function"], "2": ["py", "attribute", "Python attribute"]}, "objtypes": {"0": "py:class", "1": "py:function", "2": "py:attribute"}, "terms": {"": [2, 4, 5, 10, 12, 13, 14, 16, 17, 18, 19, 20, 32, 56, 58, 60, 61, 63, 65], "0": [2, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 58, 60, 61, 63, 65], "000": [61, 63], "0003": 63, "005": 63, "01": 56, "0123456789abcdefghijklmnopqrstuvwxyzabcdeeeffghijklmnnoopqrrssttuvwxyzz": [35, 36], "03ac13": [14, 55], "04": 56, "05": 56, "07": 56, "07219": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "08": 56, "09": 56, "0x11f2608b0": 58, "0x12253a940": 58, "0x7f91331ee3a0": [35, 36], "1": [2, 7, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 63, 65], "10": [12, 13, 56, 58, 60, 61, 63], "100": [2, 10, 12, 14, 38, 39, 40, 55, 56, 63], "1000": [12, 16, 17, 18, 19, 56, 63], "1000000": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 26, 27, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55], "1000070": 35, "10010": 36, "1006729": 12, "10087": [25, 29, 41, 54], "101": 56, "10174": 35, "102": 56, "104": 56, "105": 56, "107": 56, "1077": [14, 55], "108": 56, "109": 56, "1096": [12, 14, 55], "10_000": [61, 63], "11": 56, "110": 56, "1103": 12, "111": 56, "112": 56, "11310": 28, "116": 56, "11956": 32, "12": [12, 56, 63], "121": 56, "123": [12, 56, 61], "124": 56, "126": 56, "128": [56, 63, 65], "129": 56, "13": [12, 56], "130": 56, "132": 56, "13210": [49, 50], "133": 56, "137": 56, "139": 56, "14": [35, 36, 56], "1400": 63, "1430": [20, 21], "144": 56, "148": 56, "15": 12, "151": 56, "153": 56, "155": 56, "156560": [33, 34], "157": 56, "158": 56, "160": 56, "161": 56, "162": 56, "163": 56, "164": 56, "165": 56, "167": 56, "169": 56, "16x16": 58, "17": [12, 56], "170": 56, "1709": [25, 29, 41, 54], "171": 56, "172": 56, "177": 56, "18": [12, 56], "183": 56, "1872": 63, "19": [12, 31, 56], "1910": 32, "196": 56, "1_000": [63, 65], "1e": 61, "1f": 63, "2": [2, 10, 12, 15, 16, 17, 18, 19, 20, 21, 25, 29, 30, 31, 32, 33, 34, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 58, 60, 63], "20": [12, 56, 63], "200": [22, 23, 24, 26, 27, 28, 51, 52, 53], "2004": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "2017": [25, 29, 41, 54], "2019": 32, "2020": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "2021": [15, 63], "2022": 56, "2023": [56, 63], "2024": 56, "2059": 12, "21": 12, "211": 56, "218": 56, "22": [12, 15, 56], "224": 56, "23": 12, "239": 56, "24": [14, 25, 29, 38, 39, 40, 41, 54, 63], "240": 56, "241": 56, "244": 56, "245": 56, "25": [12, 14, 24, 25, 28, 29, 40, 41, 53, 54, 55, 56, 63], "255": [35, 36, 58], "256": [63, 65], "26": [26, 27, 28, 56], "268": 15, "27": [16, 17, 18, 19, 20, 21, 56], "28": [12, 22, 23, 24, 56], "280": 31, "29": 56, "2d": [15, 30], "2f": 63, "3": [2, 10, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 58, 63], "30": [51, 52, 53, 63], "300": [47, 48, 49, 50], "305": 56, "31": 56, "32": 65, "3360": [43, 44], "34": 56, "3606": 26, "3736": [14, 38], "3758": 51, "39": [12, 22, 23, 24, 51, 52, 53], "4": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 60, 61], "42": [58, 60, 63, 65], "4209": 31, "4356": [14, 55], "4358": 22, "45": [14, 38, 39, 40, 63], "450": [33, 34], "46": [26, 27, 28], "4752": [45, 46], "480": 63, "4958": [14, 39], "499206": [14, 39], "5": [12, 14, 61, 63], "50": [22, 25, 26, 29, 38, 41, 51, 54, 61, 63], "500": 65, "5000": [12, 14, 23, 27, 40, 52, 55, 63], "500000": [14, 38], "5025": 12, "50_000": 63, "52": 56, "54": 56, "55": 56, "57": 56, "59": [31, 33, 34], "590": 36, "6": [12, 56], "60": 56, "600": [45, 46], "604": 14, "605": 12, "621": [33, 34], "638": 14, "6729": [12, 14, 24, 55], "69": 63, "7": [12, 14, 31, 33, 34, 35, 36, 55, 56, 58, 63], "700": [20, 21], "71": 56, "73": 56, "75": 56, "77": 56, "8": [12, 15, 16, 17, 18, 19, 20, 21, 30, 42, 56, 61], "80": [16, 17, 18, 19, 56], "800": [43, 44], "82": 56, "83": 56, "84": 56, "86": 56, "87": 56, "88": 56, "884": 63, "9": [12, 31, 33, 34], "90": [20, 21, 56], "900": 63, "92": 56, "93": 56, "95": 56, "9525": [47, 48], "96": 56, "99": [56, 61, 63], "9942": 53, "A": [2, 8, 13, 32, 55, 61, 63], "And": 65, "As": [6, 13, 56, 61, 65], "At": [16, 17, 18, 19, 20], "But": [58, 63], "By": [61, 63], "For": [1, 2, 10, 11, 12, 13, 30, 56, 58, 61, 65], "If": [2, 7, 8, 10, 11, 12, 13, 14, 56, 58, 61, 63], "In": [12, 13, 56, 58, 60, 61, 63, 65], "It": [56, 61, 63], "No": 58, "Not": [14, 22, 23, 24, 26, 27, 28, 38, 39, 40, 51, 52, 53], "On": [13, 61, 63], "The": [2, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 60, 61, 65], "Then": [58, 61, 63], "There": [12, 25, 29, 41, 54, 63], "These": [10, 14, 25, 29, 30, 32, 41, 42, 54, 56, 61], "To": [1, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 63, 65], "With": 14, "_": [2, 12, 58, 60, 61, 63, 65], "_0": 61, "__call__": [4, 5, 60, 61], "__init__": [61, 65], "__len__": 3, "_build": 1, "_check_valid_cel": 61, "_gen_miss": [35, 36, 58], "_index_0": 56, "_index_1": 56, "_max": 10, "_min": 10, "_score": 10, "_script": 56, "a1efe4": [14, 55], "a256f8": 14, "a5a5a1": 14, "a_hat": 65, "a_pr": 65, "a_t": 63, "ab": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "abil": 12, "abl": [12, 42], "abort": 14, "about": [1, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58], "abov": [12, 56, 58, 60, 63], "abspath": 65, "abstract": 12, "ac": 65, "access": [8, 12, 14, 56, 61], "account": 61, "accumul": [16, 17, 18, 19, 20, 21, 61, 65], "accumulated_rew": 65, "accur": 63, "achiev": [12, 61, 65], "achieved_go": [16, 17, 18, 19, 20, 21, 31, 33, 34, 43, 44, 45, 46, 47, 48, 49, 50, 60, 61], "achieved_goal_cel": 61, "acrobot": 12, "across": [10, 13, 56], "act": 56, "action": [2, 3, 5, 6, 8, 9, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 37, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 60, 61, 63, 65], "action_id": 61, "action_idx": 61, "action_spac": [2, 8, 10, 12, 13, 56, 58, 60, 61, 65], "action_space_subset": 60, "action_spec": 63, "activ": [15, 63], "activation_class": 63, "activation_fn": 63, "actor": 63, "actor_extractor": 63, "actor_mlp": 63, "actor_modul": 63, "actor_net": 63, "acttyp": [2, 10], "actual": 61, "actuat": [30, 42], "ad": [5, 7, 8, 10, 12, 13, 43, 44, 45, 46, 47, 48, 49, 50, 56, 60], "adam": [15, 63, 65], "add": [2, 3, 4, 5, 7, 8, 14, 43, 44, 45, 46, 47, 48, 49, 50, 56, 61, 63], "add_step_data": 3, "add_to_dataset": [2, 12], "addit": [2, 5, 7, 11, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56], "addition": [15, 56], "additional_dataset": 56, "additional_group": 56, "additional_wrapp": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "address": 61, "adher": 56, "adjust": 61, "adroit_door": [22, 23, 24], "adroit_h": 14, "adroit_hamm": [26, 27, 28], "adroit_hand": [14, 22, 23, 24, 26, 27, 28, 38, 39, 40, 51, 52, 53], "adroit_pen": [14, 38, 39, 40], "adroit_reloc": [51, 52, 53], "adroithanddoor": [12, 13, 22, 23, 24, 25, 30, 56], "adroithanddoorenv": [22, 23, 24], "adroithandhamm": [26, 27, 28, 29, 30, 56], "adroithandhammerenv": [26, 27, 28], "adroithandpen": [14, 30, 38, 39, 40, 41, 56, 63], "adroithandpenenv": [38, 39, 40], "adroithandreloc": [30, 51, 52, 53, 54, 56], "adroithandrelocateenv": [51, 52, 53], "advantag": [61, 63], "after": [2, 4, 6, 9, 10, 13, 14, 56, 61, 65], "again": [16, 17, 18, 19, 20, 21], "agent": [9, 15, 16, 17, 18, 19, 20, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 60, 61, 63, 65], "aggress": 61, "agnost": [2, 63], "aim": [13, 61, 63], "al": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61, 63], "alex": [12, 16, 17, 18, 19, 20, 21], "alexdavei": 56, "alexdavey0": [16, 17, 18, 19, 20, 21], "algo": 65, "algorithm": [2, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 63], "algorithm_nam": [2, 10, 12, 13, 58, 60, 61, 65], "all": [8, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 30, 31, 32, 55, 56, 58, 62, 63, 65], "allow": [12, 13, 56, 61, 65], "alon": 61, "along": [30, 42], "alreadi": [8, 12, 14, 56, 60, 61, 63], "also": [10, 12, 14, 16, 17, 18, 19, 20, 21, 55, 56, 58, 60, 61, 63], "alwai": 61, "among": 56, "amount": [12, 61], "amp": 56, "an": [4, 7, 10, 11, 12, 13, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 47, 48, 51, 52, 53, 54, 56, 58, 61, 63], "ani": [2, 5, 6, 7, 8, 9, 10, 11, 12, 56, 60, 61], "annot": 56, "anoth": [2, 5, 8, 12, 13, 25, 29, 41, 54, 61, 63], "anssi": 15, "ant": [16, 17, 18, 19, 20, 21, 30], "ant_maze_v4": [16, 17, 18, 19, 20, 21], "antmaz": [12, 16, 17, 18, 19, 20, 21], "antmaze_larg": [15, 17], "antmaze_large_diverse_gr": [15, 16], "antmaze_medium": [15, 19], "antmaze_medium_diverse_gr": [15, 18], "antmaze_umaz": [15, 20, 21], "antmazeenv": [16, 17, 18, 19, 20, 21], "antonin": 15, "apart": 56, "api": [11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 61, 65], "appear": [12, 56], "append": [3, 8, 12, 56, 63], "appli": [8, 58], "applic": [12, 56], "appreci": 56, "approach": 61, "appropri": 13, "approx": 63, "approxim": 63, "apr": [15, 42, 61], "apt": 63, "ar": [2, 6, 8, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 51, 52, 53, 54, 55, 56, 58, 61, 63], "arang": 63, "aravind": [25, 29, 41, 54], "aravindr93": 14, "arbitrari": [13, 56], "arbitrarili": 13, "arena": [42, 47, 48], "arg": [14, 56, 61, 63], "argmax": [61, 65], "argument": [4, 5, 10, 12, 13, 56], "argv": 65, "around": [58, 63], "arrai": [10, 61], "arrow": [13, 56], "arxiv": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "as_tensor": 65, "ashlei": 15, "assert": [22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 58, 65], "assign": 10, "associ": 13, "attach": 13, "attempt": 63, "attr": 56, "attribut": [2, 4, 10, 12, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 56], "author": [2, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 61, 65], "author_email": [2, 10, 12, 13, 56, 58, 61, 65], "auto": [63, 65], "auto_cast_to_devic": 63, "autobuild": 1, "automat": [1, 2, 13, 56], "autoreset": 14, "auxiliari": 2, "avail": [7, 10, 12, 14, 55, 56, 58, 63], "averag": [2, 10, 63], "avg": 63, "avjmachin": 56, "avoid": [56, 63], "awai": 56, "ax": 63, "axi": [30, 42, 61, 63], "b": [1, 14, 55], "b64encod": 63, "back": [58, 61], "background": 56, "backpropag": 63, "backward": [63, 65], "badg": 56, "balanc": 65, "balisujohn": 56, "ball": [15, 30, 42, 54, 61], "bamboofungu": 56, "bar": 14, "base": [12, 14, 56, 61, 63], "base64": 63, "base_env": 63, "baselin": 15, "baselines3": [15, 65], "basi": 56, "basic": [56, 63], "batch": [63, 65], "batch_first": 65, "batch_siz": [63, 65], "becaus": [15, 16, 17, 18, 19, 20, 21, 42, 63], "been": [12, 42, 56], "befor": [2, 12, 58, 61, 63], "begin": [16, 17, 18, 19, 20, 65], "behav": 63, "behavior": [56, 61, 62, 63, 66], "behavioral_clon": 65, "behaviour": 63, "being": [2, 10, 13, 31, 32, 33, 34, 42, 43, 45, 47, 49], "bellman": 61, "bellow": 56, "belong": 5, "below": [14, 61, 63], "benchmark": [30, 63], "best": 63, "best_model": 65, "beta": [56, 63], "between": [10, 43, 45, 47, 49, 61], "bias": 61, "bind": 61, "bit": [61, 63], "black": 56, "blob": [58, 61], "block": 63, "blue": 63, "board": 29, "bool": [2, 5, 7, 9, 10, 11, 56, 63], "boolean": 10, "both": [8, 13, 14, 58, 60], "bottom": [31, 33, 34], "bound": [13, 61, 63], "box": [12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 60, 65], "break": [12, 56, 61, 65], "bucket": [12, 13, 55, 56], "buffer": [2, 3, 7, 8, 10, 12, 56], "bug": 56, "bugfix": 56, "build": [14, 56], "burner": [31, 33, 34], "c": [12, 16, 18, 32, 56], "cabinet": [31, 32, 33, 34], "cach": [2, 12, 56, 63], "calcul": [10, 63], "call": [2, 5, 12, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 56], "callabl": [2, 7, 8, 10, 12, 56, 58], "callback": [2, 4, 5, 56, 60, 61], "can": [2, 4, 5, 7, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 60, 61, 63, 65], "capabl": 12, "captur": 63, "care": 58, "cart": 65, "cartpol": [11, 12, 56, 65], "case": [12, 56, 61], "cd": [1, 12], "cell": [16, 18, 61], "cell_rowcol_to_xi": 61, "cell_to_st": 61, "cell_xy_to_rowcol": 61, "center": 14, "certain": [7, 12, 41], "cff": 56, "challeng": [15, 63], "chang": [1, 11, 56, 61], "changelog": 56, "characterist": [2, 61], "charg": 56, "charset": [13, 35, 36], "check": [12, 14, 56, 61], "checkpoint": 56, "choic": 63, "choos": [13, 58, 60], "chosen": 61, "ci": 56, "citat": 56, "class": [2, 3, 4, 5, 6, 7, 8, 9, 13, 56, 60, 61, 63, 65], "classic": [12, 61, 65], "classic_control": 12, "classif": 65, "clean": 58, "clear": 2, "clear_episode_buff": 56, "cli": [55, 56], "clip": 61, "clone": [1, 12, 14, 25, 29, 41, 54, 55, 56, 62, 63, 66], "close": [2, 32, 61, 63, 65], "cloud": [12, 13, 56], "cmmcirvin": 56, "code": [2, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 60, 61, 62, 63, 65], "code_permalink": [2, 10, 12, 13, 58, 61, 65], "codelink": 56, "colab": 63, "collate_fn": 65, "collect": [2, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 59, 62, 63], "collector": [2, 61], "collector_env": [56, 61], "collis": 61, "color": [14, 55], "com": [1, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 61], "combin": [56, 61], "combine_dataset": [10, 12, 56], "combined_dataset": 10, "come": [13, 14], "command": [12, 14, 56, 65], "commit": 56, "common": [12, 13], "compar": [6, 60], "comparison": 10, "compat": [10, 12, 14, 56, 65], "compatible_minari_vers": 10, "complement": 2, "complet": [32, 33, 34, 56, 63], "complex": [15, 25, 29, 30, 41, 54, 56], "compli": 56, "compliant": [13, 56], "compon": 61, "component_1": 56, "component_2": 56, "compris": 12, "comput": [2, 10, 12, 13, 63], "compute_act": 61, "compute_reward_matrix": 61, "compute_transition_matrix": 61, "concaten": 63, "condit": [7, 12, 56, 63], "configur": [32, 56, 63], "confirm": [14, 63], "conflict": 63, "conjunct": 63, "consid": [8, 56, 61, 63], "consider": 56, "consist": [13, 42, 63], "constantli": 56, "construct": 61, "contact": [11, 12, 58, 65], "contain": [1, 2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 42, 47, 48, 49, 50, 51, 52, 53, 56], "content": [13, 14], "continu": [10, 12, 13, 42, 43, 44, 45, 46, 47, 48, 49, 50, 61], "continuing_task": [16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 61], "contribut": [1, 12, 56, 61], "contributor": 56, "control": [12, 15, 42, 43, 44, 45, 46, 47, 48, 49, 50, 56, 63, 65], "conveni": 63, "convent": 56, "convers": [56, 58], "convert": [2, 61, 63], "coordin": 61, "copi": [56, 63], "core": 58, "corl": 63, "corr": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "correct": [56, 61, 63], "correspond": [2, 10, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 61, 65], "could": [15, 63], "cover": 63, "coverag": 56, "cpu": 63, "creat": [2, 5, 7, 8, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 56, 58, 60, 63, 65], "create_dataset": [2, 12, 56, 58, 60, 61, 65], "create_dataset_from_buff": [10, 12, 13, 56], "create_dataset_from_collector_env": 56, "create_namespac": 11, "creation": [2, 12, 13, 56], "credenti": 11, "cross": 65, "crossentropyloss": 65, "cuda": 63, "cumul": [61, 63], "curat": 56, "current": [5, 10, 12, 13, 14, 56, 61, 63], "current_cel": 61, "current_control_target_id": 61, "current_control_target_xi": 61, "current_st": 61, "custom": [2, 4, 12, 56, 59, 61, 62], "custom_space_seri": 58, "customstepdatacallback": 5, "customsubsetstepdatacallback": 60, "cython": 56, "d": [12, 63], "d4rl": [10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 59, 62, 63], "da": 61, "dampen": 61, "dapg": [14, 23, 24, 25, 27, 28, 29, 39, 40, 41, 52, 53, 54], "data": [2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 29, 30, 32, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 58, 63, 65], "data_collector": 60, "data_format": [2, 8, 10, 56], "data_path": 8, "data_url": 63, "databas": [10, 11, 14], "databefor": 2, "dataclass": [8, 56], "datacollector": [4, 12, 13, 56, 58, 60, 61, 65], "datacollectorv0": 56, "dataload": [12, 56, 65], "datas": 8, "dataset": [2, 4, 5, 6, 7, 11, 15, 25, 29, 30, 32, 37, 41, 42, 54, 55, 56, 58, 60, 63], "dataset_cr": [56, 58, 61], "dataset_id": [2, 10, 11, 12, 13, 56, 58, 60, 61, 63, 65], "dataset_nam": [2, 10, 13, 14, 61], "dataset_s": 56, "dataset_v1": 56, "dataset_v2": 56, "dataset_v3": 56, "datasets_to_combin": [10, 56], "davei": [12, 16, 17, 18, 19, 20, 21], "de": [12, 14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 51, 52, 53], "decent": 63, "decod": 63, "deep": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "def": [5, 58, 60, 61, 63, 65], "default": [2, 5, 7, 8, 10, 11, 12, 13, 63], "default_interaction_typ": 63, "defin": [13, 58, 60, 65], "definit": 56, "del": [58, 60], "deleg": 56, "delet": [58, 60], "delete_dataset": [10, 58, 60], "delete_namespac": 11, "demonstr": [22, 24, 25, 26, 28, 29, 31, 32, 38, 40, 41, 51, 53, 54, 63], "dens": [14, 22, 23, 24, 26, 27, 28, 38, 39, 40, 42, 51, 52, 53, 56, 63], "depend": [12, 13, 56], "deprec": 56, "descent": 63, "describ": [11, 13, 56], "descript": [2, 10, 11, 13, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 56], "deseri": 58, "deserialize_custom_spac": 58, "deserialize_spac": 58, "design": 63, "desir": [32, 61], "desired_cel": 61, "desired_go": [16, 17, 18, 19, 20, 21, 31, 33, 34, 43, 44, 45, 46, 47, 48, 49, 50, 60, 61], "detail": 63, "detect": 56, "determin": 61, "determinist": [12, 61], "develop": 56, "deviat": [13, 61], "devic": [14, 63], "dexter": [25, 29, 41, 54], "df8ff078652a": [15, 42, 61], "dict": [2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 16, 17, 18, 19, 20, 21, 31, 33, 34, 35, 36, 43, 44, 45, 46, 47, 48, 49, 50, 56, 58, 60], "dict_kei": 60, "dictionari": [2, 3, 5, 7, 8, 9, 10, 12, 13, 56, 59, 61, 62, 63], "differ": [10, 12, 13, 42, 56, 58, 61, 63], "dimens": [63, 65], "dimension": [13, 25, 29, 41, 54], "dir": 56, "direct": [35, 36, 58, 63], "directli": [12, 56, 61, 63, 65], "directori": [2, 8, 11, 12, 63], "dirhtml": 1, "disabl": 2, "disable_env_check": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "discount": 61, "discret": [13, 35, 36, 56, 58, 61, 65], "disk": [8, 12, 13, 56, 58, 60, 65], "displai": [63, 65], "dist": 61, "distanc": [43, 45, 47, 49], "distribut": [25, 29, 41, 54, 63], "distribution_class": 63, "distribution_kwarg": 63, "divers": [12, 15], "divid": [12, 61], "do": [61, 63], "doc": [1, 56, 58, 61], "document": [12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56], "doe": 56, "doesn": [8, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 56, 61], "dof": [15, 25, 29, 30, 41, 54, 63], "domain": [15, 25, 29, 30, 41, 42, 54], "don": [13, 56, 58, 60, 61], "done": [12, 61, 63, 65], "door": [10, 12, 13, 14, 22, 23, 24, 30, 32, 55, 56], "dormann": 15, "dot": [61, 63], "doubl": 63, "doubletofloat": 63, "down": 61, "download": [13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 60, 61, 62, 63, 65], "download_dataset": 10, "download_namespace_metadata": 11, "driven": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "dt": 61, "dtype": [56, 60, 61, 63], "due": [56, 61], "dump": 58, "dure": [12, 13, 56, 61, 63], "dynam": 61, "e": [1, 7, 10, 12, 56, 63], "e731": 58, "each": [2, 4, 5, 6, 8, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 60, 61, 63, 65], "earlier": 58, "edit": [2, 5], "effect": [25, 29, 41, 54], "effici": 56, "element": [6, 13], "elif": 61, "elimin": 61, "ell": 63, "elliottow": 56, "els": [12, 56, 61, 63], "email": [2, 10, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56], "embed": 63, "empti": [11, 58, 61], "emptyenv": 58, "enabl": 58, "encapsul": 13, "encount": 58, "encourag": [13, 56], "end": [13, 56], "enerrio": 56, "enhanc": 56, "ensur": 63, "entri": 61, "entropi": 65, "entry_point": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56], "env": [2, 5, 7, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 60, 61, 63, 65], "env_id": 63, "env_nam": [2, 10, 13], "env_spec": [8, 13], "envid": 2, "environ": [2, 5, 6, 7, 8, 9, 10, 13, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 55, 56, 58, 60, 61, 65], "environment_st": 5, "envspec": [2, 8, 10, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56], "eol": 56, "ep": 12, "episod": [2, 3, 4, 6, 7, 8, 10, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 60, 61, 63, 65], "episode_0": 56, "episode_1": 56, "episode_2": 56, "episode_id": [12, 56], "episode_indic": [7, 8, 12], "episode_metadata_callback": [2, 4], "episode_reward": 63, "episodebuff": [7, 8, 10], "episodedata": [7, 12, 56], "episodemetadatacallback": [2, 13, 56], "episodes_gener": 12, "epoch": 65, "epsiodedata": 8, "equal": [2, 10, 13], "equat": 61, "equiv": 63, "equlival": 61, "ernestu": 15, "error": [10, 56, 58, 61, 63], "essenti": 63, "estim": [2, 10, 63], "et": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61, 63], "etc": 63, "euclidean": [43, 45, 47, 49], "evad": 61, "eval_env": [2, 7, 10, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "eval_env_spec": [12, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53], "eval_interv": 63, "eval_reward_log": 63, "eval_td": 63, "evalu": [2, 7, 10, 12, 56, 63, 65], "evaluate_polici": 63, "everi": [1, 10, 12, 13, 21, 61, 63], "everyth": 63, "exampl": [2, 10, 11, 12, 13, 14, 56, 58, 61, 62, 63], "example_env": 63, "except": [8, 56, 58, 63], "excit": 56, "execut": 65, "exerpt": 56, "exist": [8, 11, 14, 56, 60, 61], "exit": 14, "expect": 60, "expectil": 63, "experienc": 56, "experiment": 11, "expert": [2, 10, 12, 13, 14, 15, 22, 25, 26, 29, 36, 37, 38, 41, 51, 54, 55, 56, 63, 65], "expert_polici": [2, 10], "expertpolici": [36, 65], "explain": [56, 61], "explicit": [56, 63], "explicitli": 56, "explor": 56, "exploration_act": 61, "explorationtyp": 63, "export": [12, 56], "extend": [12, 60], "extra": [2, 4, 5, 56, 61], "extract": 63, "extrapol": 63, "f": [12, 14, 56, 58, 60, 63, 65], "f01e2c": 14, "f4bf75": 14, "facilit": [10, 12, 56], "factor": 61, "factori": 3, "fail": [16, 17, 18, 19, 20, 21, 56], "fals": [2, 7, 10, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 58, 60, 61, 63, 65], "familiar": 63, "farama": [1, 10, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 61, 63, 65], "favor": 56, "fc1": 65, "fc2": 65, "fc3": 65, "featur": [11, 12, 55, 56, 65], "fed000": 14, "few": 56, "ff00ff": [14, 55], "ffmpeg": 63, "field": [13, 56, 63], "fig": 63, "figsiz": 63, "figur": 63, "file": [2, 4, 11, 12, 13, 14, 55, 56, 60], "file_fold": 56, "filter": [7, 55, 56], "filter_dataset": [12, 56], "filter_episod": [7, 12, 56], "final": [6, 12, 15, 56, 58, 60, 61, 63], "final_scor": 63, "find": 60, "fine": [14, 23, 25, 27, 29, 39, 41, 52, 54], "first": [11, 12, 56, 58, 60, 61, 63], "fit": [60, 63], "fix": [21, 30, 42, 56, 63], "flag": [10, 56, 63], "flatten": 56, "flexibl": 12, "flip": [16, 17, 18, 19, 20, 21, 32], "float": [2, 8, 10, 13, 60, 63], "float32": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 61, 65], "float64": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 60, 63], "floppy_disk": 56, "folder": [1, 65], "follow": [2, 5, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 61, 63], "font": [14, 55], "forc": [10, 14, 30, 42, 61], "force_download": [10, 56], "form": [10, 13, 61], "format": [2, 8, 10, 12, 13, 56, 58], "formula": [10, 61], "forward": [11, 13, 63, 65], "found": [10, 13], "foundat": [1, 12, 14, 30, 56, 58, 61], "four": 65, "fourroom": [30, 37], "fourroomsenv": [35, 36], "fp": 63, "frac": 10, "frame": 63, "framework": 63, "franka_kitchen": [31, 33, 34], "frankakitchen": [30, 31, 32, 33, 34, 56], "from": [2, 5, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 60, 61, 63, 65], "from_pixel": 63, "froze": 56, "fu": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "full": [4, 8, 12, 36, 37, 56, 63], "fulli": 56, "function": [7, 8, 10, 12, 13, 14, 35, 36, 42, 43, 44, 45, 46, 47, 48, 49, 50, 56, 58, 61, 63, 65], "fundament": [15, 42, 61], "futur": [11, 12, 56, 61], "g": [12, 16, 17, 18, 19, 20, 21, 35, 36, 43, 44, 45, 46, 47, 48, 49, 50, 63], "gain": 61, "gamma": [61, 63], "gather": 63, "gcp": [12, 13, 55, 56], "gen_dataset_md": 56, "gener": [2, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 60, 61], "generate_path": 61, "get": [7, 8, 10, 12, 56, 58, 60, 61, 63, 65], "get_episod": 8, "get_episode_metadata": [8, 13], "get_namespace_metadata": 11, "get_next_st": 61, "get_normalized_scor": [2, 10, 56], "get_q_valu": 61, "get_siz": 8, "git": [1, 12], "github": [1, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 61], "give": [12, 13, 14, 61, 63], "given": [12, 13, 14], "gleav": 15, "global": [2, 13, 61], "global_target_id": 61, "global_target_xi": 61, "glr": 56, "gmail": [16, 17, 18, 19, 20, 21, 35, 36], "go": [1, 61], "goal": [15, 16, 17, 18, 19, 20, 21, 32, 36, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 58, 60, 61, 63], "goal_cel": 61, "goe": [36, 37], "googl": [13, 56, 63], "gradient": 63, "grahamannett": 56, "greater": [12, 56], "green": [58, 63], "grid": 61, "gridworld": 37, "group": [2, 4, 10, 12, 13, 14, 30, 56, 61], "gt": 56, "guarante": 13, "gupta": 32, "gym": [2, 5, 7, 10, 12, 56, 58, 60, 61, 63, 65], "gymansium": 12, "gymenv": 63, "gymnaisum": 14, "gymnasium": [2, 5, 7, 8, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 60, 61, 63, 65], "gymnasium_robot": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "gynasium": 56, "h5py": 56, "ha": [12, 21, 42, 56, 61, 63], "hammer": [26, 27, 28, 30, 56], "hand": [13, 16, 18, 25, 29, 41, 54, 61, 63], "hand_dapg": [14, 25, 29, 30, 41, 54], "handl": [8, 12, 55], "hat": 63, "hausman": 32, "have": [12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 36, 38, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 58, 60, 61, 63, 65], "hdf5": [2, 4, 8, 13, 14, 55, 56, 60, 61], "help": [14, 56, 61], "helper": 63, "here": [63, 65], "hesit": 56, "hidden": 56, "hidden_s": 63, "hierarch": 12, "high": [25, 29, 41, 54, 56, 60, 61, 63], "higher": 61, "highli": 56, "hill": 15, "hing": [31, 33, 34], "hood": 63, "horizon": 32, "host": [12, 14, 25, 29, 30, 32, 41, 54, 55], "how": [1, 2, 56, 58, 60, 61, 63, 65], "howev": [13, 42, 56, 58, 61, 63, 65], "howuhh": 56, "href": 14, "html": 63, "http": [1, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 58, 61, 65], "hub": 56, "human": [10, 12, 13, 14, 22, 25, 26, 29, 38, 41, 51, 54, 55, 56, 63, 65], "hyperparamet": 63, "hypothet": [2, 10], "i": [1, 2, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 32, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 60, 63, 65], "id": [2, 3, 6, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 61, 65], "idea": 56, "identifi": [2, 10, 11, 13], "ignor": [56, 63], "im": 56, "imag": [35, 36, 58, 63], "imit": [22, 25, 26, 29, 32, 38, 41, 51, 54], "implement": [14, 15, 61, 63], "implicit": [62, 66], "implicitli": 63, "import": [2, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 60, 61, 63], "import_bugfix": 56, "improv": [56, 63], "imshow": 63, "in_kei": 63, "includ": [6, 13, 31, 32, 34, 42, 56, 63], "incompat": 14, "incorrect": [8, 56], "increas": 6, "indic": [2, 7, 8, 10, 12, 56], "inf": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 60], "infer": 63, "influenc": [61, 63], "info": [2, 3, 5, 6, 9, 12, 13, 56, 61, 65], "inform": [1, 2, 5, 7, 13, 56, 61], "infos_dataset": 56, "infos_subgroup": 56, "init": 56, "initi": [2, 6, 7, 12, 13, 56, 58, 60, 61, 63, 65], "initialis": 63, "input": [5, 7, 12, 13, 63, 65], "input_dim": 65, "insid": 58, "inspir": 61, "instabl": 61, "instal": [1, 10, 14, 55, 56, 58, 63, 65], "instanc": [7, 56], "instanti": 14, "instead": [12, 13, 56, 61, 63], "instruct": 56, "int": [2, 3, 6, 7, 8, 10, 13, 56, 61], "int64": [56, 65], "int_": [7, 61], "integ": 13, "intend": 7, "interact": 32, "interest": 63, "interfac": 12, "intern": [12, 56], "introduc": [15, 25, 29, 41, 54, 56, 63], "invers": 63, "involv": [30, 42, 61], "ipynb": [58, 60, 61, 63, 65], "ipython": 63, "iql": 63, "iql_torchrl": 63, "iqlloss": 63, "is_avail": 63, "is_shar": 63, "isinst": 65, "isol": 56, "issu": [56, 63], "item": [2, 61, 63, 65], "iter": [7, 8, 12, 13, 15, 42, 61, 63], "iterate_episod": [7, 12, 56], "its": [10, 56, 58, 61, 63], "itself": 12, "j": 61, "jamartinh": 56, "josephcarrino": 56, "journal": 15, "json": [13, 14, 56, 58], "jupyt": [58, 60, 61, 62, 63, 65], "just": [12, 58, 63], "justin": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "k": 32, "k_": 61, "k_d": 61, "k_i": 61, "k_p": 61, "kabuki": 56, "kaixin96": 56, "kanervisto": 15, "keep": [12, 56], "kei": [2, 5, 8, 10, 12, 14, 56, 60, 61, 63], "kept": 13, "kernel": 63, "kettl": [31, 32, 33, 34], "key_fil": 14, "key_path": 11, "kitchen": [30, 31, 33, 34, 56], "kitchenenv": [31, 33, 34], "kitsch": 56, "know": 61, "kostrikov": 63, "kumar": 32, "kwarg": [2, 5, 7, 11, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 60], "l": 63, "l2": 63, "l_": 63, "l_2": 63, "l_pi": 63, "l_q": 63, "l_v": 63, "lag": 63, "lambda": [7, 12, 56, 58, 61], "lambert": [15, 42, 61], "larg": [12, 15, 42, 56], "larger": [56, 61, 63], "largest": 56, "last": 56, "last_episode_id": 56, "later": [2, 10, 56, 63], "latest": [10, 14, 56, 61], "latest_vers": 10, "latter": [10, 13, 63], "layer": 63, "lazcano": [12, 14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 51, 52, 53], "lazi": 63, "lazylinear": 63, "lead": [13, 16, 17, 18, 19, 20, 21, 61], "learn": [12, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 55, 56, 58, 60, 61, 62, 65, 66], "learnin": [15, 42, 61], "leav": 12, "left": [12, 61, 63], "leftarrow": [61, 63], "len": [61, 63], "length": [3, 65], "less": 61, "let": [58, 60, 61, 65], "level": 13, "levin": 32, "lib": 63, "librari": [12, 56, 58, 65], "light": [31, 32, 33, 34], "like": [11, 12, 14, 58, 63, 65], "limit": [61, 63], "linalg": 61, "line": [14, 60], "linear": 65, "link": [2, 10, 12, 13], "linux": 12, "list": [2, 3, 7, 8, 12, 13, 55, 56, 63, 65], "list_local_dataset": [10, 12, 56, 60], "list_local_namespac": 11, "list_remote_dataset": [10, 56], "list_remote_namespac": 11, "ll": [58, 60], "load": [2, 11, 13, 56, 58, 63, 65], "load_dataset": [2, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 65], "loc": 63, "local": [10, 13, 56, 58, 60, 63, 65], "local_dataset": 60, "locat": [12, 15, 16, 17, 18, 19, 20, 21, 30, 42, 43, 44, 45, 46, 47, 48, 49, 50, 61, 63], "log": [56, 63, 65], "long": [32, 61], "longer": 56, "look": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58], "loop": [12, 63, 65], "loos": 56, "lose": 12, "loss": 65, "loss_actor": 63, "loss_dict": 63, "loss_fn": 65, "loss_funct": 63, "loss_log": 63, "loss_modul": 63, "loss_qvalu": 63, "loss_valu": 63, "lost": 56, "low": [56, 60, 61, 63], "lower": 13, "lr": 63, "lynch": 32, "m_": 63, "machin": [13, 15], "maco": 12, "made": [1, 56], "mai": [11, 12, 61, 63], "main": [2, 7, 56, 58, 61, 63], "main_data": [14, 55, 56], "major": 56, "make": [1, 2, 7, 12, 56, 58, 60, 61, 63, 65], "make_value_estim": 63, "manag": 56, "mandatori": [13, 56], "mani": 13, "manipul": [25, 29, 41, 54, 63], "manual_se": [63, 65], "map": [12, 16, 18, 61, 63], "map_length": 61, "map_width": 61, "margin": 63, "markdown": 56, "markovian": [15, 42], "master": 61, "match": 10, "mathbb": 63, "mathcal": 63, "matplotlib": 63, "matrix": 61, "max": [61, 63], "max_": [61, 63], "max_a": 63, "max_episode_step": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 61, 63], "max_step": 63, "maximilian": 15, "maximis": 63, "maximum": [2, 10, 13, 61, 63, 65], "maze": [16, 17, 18, 19, 20, 21, 30, 43, 44, 45, 46, 47, 48, 49, 50, 56, 61], "maze2d": [42, 61], "maze_map": [16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 61], "maze_solv": 61, "mb": [8, 12, 14, 55], "md": [1, 56], "mdp": [12, 56], "mean": [6, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 61, 63], "meant": [2, 56], "measur": [25, 29, 41, 54, 61], "medium": [12, 15, 42, 56], "memor": [15, 42], "memori": [2, 12, 56], "mention": [13, 56, 61, 65], "merg": 14, "messag": 14, "met": 7, "metadata": [2, 4, 7, 8, 10, 12, 14, 56, 60], "method": [12, 15, 42, 56, 58, 61, 63], "metric": 13, "mgoulao": 56, "microwav": [31, 32, 33, 34], "mimic": 15, "min": 63, "minari": [11, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 60, 63, 65], "minari_autose": 2, "minari_data": 63, "minari_dataset": [56, 65], "minari_datasets_path": 13, "minari_remot": [12, 56], "minari_storag": 56, "minari_vers": [13, 56], "minaridataset": [2, 10, 12, 13, 56, 65], "minariexperiencereplai": 63, "minaristorag": [2, 7, 10, 13, 56], "minigrid": [30, 35, 36, 56, 58], "minim": 60, "minimis": 63, "minimum": [2, 10, 12, 13, 56], "minor": 56, "mirana": 60, "misc": 56, "miss": 56, "mission": [35, 36, 58], "mission_func": 58, "missionspac": [35, 36, 58], "missonspac": 58, "mix": [22, 25, 26, 29, 32, 38, 41, 51, 54, 56], "mlp": 63, "mode": 63, "modifi": [8, 12, 13, 56, 60], "modul": [58, 60, 61, 63, 65], "modulelist": 63, "moment": 13, "more": [1, 6, 12, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 61, 63], "more_dataset": 56, "moreov": [8, 13], "morpholog": 15, "most": [12, 14], "move": [12, 30, 32, 42, 54, 56, 61], "mp4": 63, "mujoco": [2, 10, 61], "multi": 63, "multipl": [10, 11, 12, 14, 56, 63], "must": [5, 7, 8, 10, 12, 13, 56, 63], "my": 12, "n": [7, 12, 13, 14, 61, 65], "n_episod": [7, 12], "n_step": [56, 61], "nail": 29, "name": [2, 10, 11, 12, 13, 14, 55, 56, 58, 65], "namespac": [2, 10, 56], "namespace_metadata": 13, "narrow": [25, 29, 41, 54], "nathan": [15, 42, 61], "navig": [15, 30, 37, 42], "ncol": 63, "ndarrai": [6, 7, 10, 13, 56], "necessari": 63, "need": [8, 12, 56, 58, 60, 61, 63, 65], "neg": [43, 45, 47, 49], "nest": [2, 5, 11, 13, 56], "net": 63, "network": [63, 65], "neural": 65, "never": [32, 33, 61, 63], "new": [2, 8, 10, 12, 16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 56, 58, 61, 63, 65], "new_dataset_id": [10, 56], "new_dataset_nam": 14, "newli": [10, 12, 63], "next": [9, 56, 61, 63, 65], "next_cel": 61, "next_episode_id": 56, "next_stat": 61, "nightli": 63, "nn": [63, 65], "no_grad": 63, "noah": 15, "nois": [43, 44, 45, 46, 47, 48, 49, 50, 56, 61], "non": [12, 13, 15, 42], "nondeterminist": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "none": [2, 3, 5, 7, 8, 9, 10, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 61], "nonetyp": 56, "noqa": 58, "norm": 61, "normal": [2, 63], "normalized_scor": 10, "normalparamextractor": 63, "note": [10, 11, 13, 16, 17, 18, 19, 20, 21, 60, 61, 63], "notebook": [58, 60, 61, 62, 63, 65], "notic": 12, "notimplementederror": 58, "now": [10, 12, 56, 58, 60, 61, 65], "np": [7, 10, 13, 56, 60, 61, 63, 65], "npt": 7, "nrow": 63, "num_act": 61, "num_cel": 63, "num_episod": [58, 60], "num_episodes_average_scor": [2, 10], "num_epoch": 65, "num_eval_episod": 63, "num_itr": 61, "num_stat": 61, "num_step": 2, "number": [2, 6, 7, 10, 12, 13, 14, 56], "numpi": [60, 61, 63, 65], "o": 65, "ob": [2, 5, 12, 56, 61, 65], "object": [7, 8, 9, 12, 25, 29, 32, 37, 41, 54, 56, 58, 63, 65], "observ": [2, 3, 5, 6, 8, 9, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 37, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 60, 61, 63, 65], "observation_spac": [2, 8, 10, 12, 13, 56, 58, 60, 65], "observation_space_subset": 60, "obstyp": [2, 10], "obtain": [22, 25, 26, 29, 38, 41, 51, 54, 61], "occur": [16, 17, 18, 19, 20, 21], "off": 14, "offici": 56, "offlin": [12, 13, 14, 55, 56, 61, 63, 65], "often": 61, "oibserv": 56, "omar": [35, 36], "omit": 60, "onc": [1, 12, 61, 63, 65], "one": [2, 6, 7, 8, 12, 25, 29, 41, 42, 54, 56, 63], "one_hot": 65, "onli": [10, 11, 12, 13, 42, 44, 46, 47, 48, 50, 56, 60, 63], "onlin": 63, "onto": 11, "open": [25, 32, 42, 56, 63], "opengl": 63, "optim": [61, 65], "option": [2, 3, 5, 7, 8, 10, 12, 13, 14, 56], "order": [12, 31, 32, 56, 60], "order_enforc": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "org": [11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 58, 61, 65], "organ": 56, "orient": [5, 41, 60], "origin": [10, 12, 25, 29, 30, 32, 41, 42, 54, 56, 58, 63], "other": [7, 8, 10, 11, 12, 13, 14, 32, 34, 56, 60, 61, 63], "otherwis": [7, 12, 44, 46, 48, 50, 56], "our": [1, 12, 13, 56, 60, 61, 63, 65], "ourselv": 61, "out": [8, 12, 56, 58, 61, 63], "out_featur": 63, "out_kei": 63, "outlin": 60, "output": [8, 58, 60, 61, 63, 65], "output_dim": 65, "outsid": 63, "over": [2, 7, 10, 12, 61, 63], "overal": 63, "overconfid": 63, "overestim": 63, "overrid": [4, 5, 13, 14, 61], "overridden": [4, 5, 10, 56], "overridng": 61, "overshoot": 61, "overview": 63, "overwrit": 11, "own": [10, 12, 56, 61], "p_": 61, "packag": [1, 2, 10, 14, 56, 65], "pad": 65, "pad_sequ": 65, "page": 56, "page_facing_up": 56, "pair": [13, 63], "paper": [25, 29, 41, 54], "paramet": [2, 3, 4, 5, 7, 8, 10, 11, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 63, 65], "parameteris": 63, "part": 63, "partial": [32, 56], "particular": [58, 63], "pass": [2, 4, 7, 10, 12, 60, 63], "past": 56, "path": [8, 11, 12, 13, 14, 43, 44, 45, 46, 47, 48, 49, 50, 56, 61, 65], "path_str": 14, "pathlik": [7, 8], "pbar": 63, "pd": [42, 43, 44, 45, 46, 47, 48, 49, 50, 61], "pen": [14, 30, 38, 39, 40, 56], "per": [2, 56], "perceptron": 63, "perez": [43, 44, 45, 46, 47, 48, 49, 50, 61], "perform": [9, 10, 12, 14, 32, 33, 34, 61, 63, 65], "perimet": [42, 47, 48], "permalink": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "perman": 12, "pettingzoo": 56, "phi": 63, "pi": [61, 63], "pi_": 63, "pick": [16, 18], "pid": [56, 61], "pip": [1, 2, 10, 12, 13, 14, 55, 58, 63, 65], "pixel": 63, "pixels_onli": 63, "plai": [12, 15], "plan": [12, 56, 60], "planner": [15, 42], "platform": 13, "pleas": [11, 12, 56, 60], "plot": 63, "plt": 63, "plug": 63, "point": [7, 30, 56, 63], "point_maz": [43, 44, 45, 46, 47, 48, 49, 50], "point_maze_dataset": [56, 61], "pointmaz": [15, 30, 43, 44, 45, 46, 47, 48, 49, 50, 56, 59, 60, 62], "pointmaze_larg": [42, 44], "pointmaze_largedens": [42, 43], "pointmaze_medium": [42, 46, 61], "pointmaze_mediumdens": [42, 45], "pointmaze_open": [42, 48], "pointmaze_opendens": [42, 47], "pointmaze_umaz": [42, 50, 60], "pointmaze_umazedens": [42, 49], "pointmazeenv": [43, 44, 45, 46, 47, 48, 49, 50], "pointmazestepdatacallback": 61, "pole": 65, "polici": [2, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 29, 30, 32, 36, 37, 38, 39, 41, 42, 51, 52, 54, 61, 63], "policy_net": 65, "policynetwork": 65, "polyak": 63, "poorli": 63, "popul": 63, "popular": 55, "pose": [5, 61], "posit": [5, 32, 37, 54, 61, 63], "possibl": [13, 56], "ppo": 65, "pr": 56, "practic": 63, "pre": 56, "precis": 63, "precommit": 56, "predict": [61, 65], "prepend": 11, "preprint": 32, "prerequisit": 63, "present": [10, 15, 30, 65], "prevent": 12, "previou": [2, 12, 56], "previous": [15, 56, 61, 65], "principl": 30, "print": [12, 56, 58, 60, 63, 65], "prng": 2, "probabilisticactor": 63, "probabl": 61, "problem": 65, "proce": [14, 65], "procedur": 60, "process": [12, 56, 61, 63], "prod": 65, "produc": 56, "program": 61, "progress": 14, "project": [12, 56], "prompt": [12, 14], "properli": [58, 63], "properti": [7, 63], "proporti": 61, "provid": [10, 12, 13, 14, 15, 16, 18, 22, 23, 24, 25, 26, 27, 28, 29, 30, 38, 39, 40, 41, 51, 52, 53, 54, 55, 56, 63], "pseudo": 56, "psi": 63, "public": [13, 56, 61], "publicli": 55, "pure": 56, "purpos": [12, 30, 42, 61, 63], "py": [56, 58, 60, 61, 63, 65], "pyarrow": 56, "pypi": 56, "pyplot": 63, "pyright": 56, "pytest": 56, "python": [12, 55, 56, 58, 60, 61, 62, 63, 65], "python3": 63, "pytorch": [56, 62, 63, 66], "pytorchdataload": 56, "pyvirtualdisplai": 63, "pz": 56, "q": [61, 62, 66], "q_": 63, "q_fn": 61, "q_iter": 61, "q_net": 63, "q_valu": 61, "qiter": [15, 16, 17, 18, 19, 20, 21, 42, 43, 44, 45, 46, 47, 48, 49, 50, 61], "qpo": 61, "quadrup": [15, 30], "quantifi": 63, "queri": 63, "quick": 63, "quickli": 61, "quit": 63, "qvalu": 63, "qvel": 61, "r": [1, 16, 17, 18, 19, 20, 21, 61, 63], "r_t": 63, "raffin": 15, "rais": [8, 10], "rajeswaran": [25, 29, 41, 54], "randn": 61, "random": [2, 7, 10, 12, 17, 19, 20, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 58, 60, 61, 63, 65], "random_polici": [58, 60], "randomis": 63, "randomli": [12, 13, 42, 58, 61], "randompolici": 35, "rang": [2, 10, 12, 56, 58, 60, 61, 63, 65], "rate": [16, 17, 18, 19, 20, 21, 61], "rather": 63, "ratio": [22, 25, 26, 29, 38, 41, 51, 54], "rb": 63, "re": [56, 61], "reach": [15, 16, 17, 18, 19, 20, 21, 32, 37, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 56, 61], "read": [8, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 63], "readabl": 13, "readi": 56, "readm": 56, "real": 15, "reason": 61, "rebuild": 1, "receiv": 65, "recent": [12, 63], "recommend": 12, "record": [2, 12, 56, 60, 61], "record_info": [2, 12, 13, 61], "recov": [2, 7, 10, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 63], "recover_env": 56, "recover_environ": [2, 7, 10, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 65], "recoveri": 56, "redtachyon": 56, "reduc": [56, 61], "ref": 10, "ref_max_scor": [2, 10], "ref_min_scor": [2, 10], "refactor": [56, 61], "refer": [2, 10, 30, 56], "referenc": 56, "regener": 37, "regist": 58, "registr": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "registri": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "reinforc": [12, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 55, 61], "rel": 56, "relai": [30, 32], "releas": 11, "relev": [2, 10, 12], "reliabl": 15, "reloc": [30, 51, 52, 53, 56], "relu": [63, 65], "rememb": 63, "remot": [10, 11, 12, 13, 14, 55, 56], "remov": [12, 56], "remove_task_when_complet": [31, 33, 34], "renam": 56, "render": 63, "render_mod": 65, "reorgan": 56, "replac": [15, 30, 61], "replai": [12, 56], "replay_buff": 63, "repositori": [10, 13, 14, 23, 24, 25, 27, 28, 29, 30, 32, 39, 40, 41, 52, 53, 54], "repres": [13, 58, 63], "represent": 56, "reproduc": [2, 10, 12, 30, 37, 63, 65], "reproduct": [30, 56], "requir": [1, 2, 10, 12, 13, 14, 56, 58, 60, 61, 63, 65], "research": 15, "reset": [2, 12, 13, 16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 56, 58, 60, 61, 63, 65], "reset_target": [16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50], "resid": 11, "residu": 56, "respect": [10, 61, 63], "respond": 61, "respons": 12, "rest": 63, "restart": 63, "result": [10, 56, 58, 61], "results_video": 63, "retriev": [10, 12, 56], "return": [2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 44, 46, 48, 50, 51, 52, 53, 56, 58, 60, 61, 63, 65], "rew": [2, 5, 12, 56, 61, 65], "rew_matrix": 61, "reward": [3, 5, 6, 12, 13, 15, 16, 17, 18, 19, 20, 21, 25, 29, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 56, 63, 65], "reward_funct": 61, "reward_threshold": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "reward_typ": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "rewards_max": 13, "rewards_mean": 13, "rewards_min": 13, "rewards_std": 13, "rewards_sum": 13, "right": [56, 61, 63], "rl": [12, 14, 23, 25, 27, 29, 39, 41, 52, 54, 56, 63, 65], "rl_zoo3": [56, 65], "rm": 63, "rnd": 56, "rnn": 65, "robot": [14, 15, 25, 29, 30, 41, 54, 56, 60, 61, 63], "rodrigo": [12, 14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 61], "rodrigodelazcano": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56], "roll": 63, "rollout": 63, "root": [12, 13], "row": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "rperezvicent": [14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 61], "rugged": 56, "run": [12, 22, 25, 26, 29, 38, 41, 51, 54, 56, 63], "s_": 63, "s_t": 63, "sac": [15, 16, 17, 18, 19, 20, 21], "safe": 56, "same": [2, 7, 10, 12, 13, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 56, 61, 63], "sampl": [2, 7, 13, 35, 37, 55, 56, 58, 60, 63], "sample_episod": [7, 12, 13, 56], "sampled_episod": 13, "sampler": 63, "samplerwithoutreplac": 63, "save": [4, 13, 56, 58, 60, 61, 63, 65], "save_video": 63, "scale": 63, "scale_lb": 63, "scenario": 65, "schedul": [12, 56], "score": [2, 63], "script": [14, 30, 63, 65], "second": [12, 56], "section": [13, 56, 63], "see": [13, 58, 63], "seed": [2, 3, 7, 10, 12, 13, 56, 58, 60, 61, 63, 65], "seen": 61, "select": [16, 17, 18, 19, 20, 25, 29, 41, 42, 54, 56, 61], "self": [2, 3, 4, 5, 7, 8, 60, 61, 65], "separ": 56, "sequenc": [32, 33, 34, 42], "sequenti": 63, "seri": [12, 61], "serial": [13, 56, 59, 62], "serializ": 13, "serialize_custom_spac": 58, "serialize_spac": 58, "serv": 12, "server": [10, 11, 12, 14, 55, 63], "servic": 56, "set": [2, 7, 10, 12, 13, 15, 16, 17, 18, 19, 20, 21, 56, 61, 63, 65], "set_descript": 63, "set_exploration_typ": 63, "set_se": [7, 12, 63], "set_titl": 63, "set_xlabel": 63, "setpoint": 61, "sever": 13, "shape": [15, 20, 21, 42, 49, 50, 56, 60, 61, 63, 65], "shard": 12, "share": [56, 63], "shift": [13, 63], "should": [2, 58, 60], "show": [12, 55, 56, 58, 60, 63], "shown": [14, 63], "shreyansjainn": 56, "shuffl": 65, "sim": 63, "similarli": [56, 63], "simpl": [12, 56, 61, 63, 65], "simplefilt": 63, "simpli": [58, 61], "sinc": [58, 61, 65], "singl": [3, 6, 9, 10, 12, 14, 56, 63], "size": [8, 10, 12, 14, 55, 56, 61, 63], "skip": [10, 63], "slash": [11, 13], "slice": [7, 8], "slide": [31, 32, 33, 34], "slightli": 56, "slowli": [61, 63], "small": [56, 63], "smaller": [42, 56, 61], "snippet": 12, "so": [12, 13, 61, 63], "soft": 63, "softupd": 63, "solut": 61, "solv": [32, 61], "solver": 61, "some": [2, 8, 12, 14, 56, 58, 61, 63], "sourc": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 56, 58, 60, 61, 62, 63, 65], "space": [2, 8, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 37, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 59, 61, 62, 63, 65], "space_dict": 58, "spars": [15, 16, 17, 18, 19, 20, 21, 25, 29, 41, 42, 44, 46, 48, 50, 54], "spec": [2, 7, 10, 13, 14, 56, 58, 63], "specif": [12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 60, 61, 63], "specifi": [2, 7, 8, 12, 13, 56, 63], "speed": [56, 61], "sphinx": 1, "sphinx_github_changelog_token": 56, "sphx": 56, "split": [42, 56], "split_dataset": [10, 12, 56], "split_traj": 63, "squar": 58, "src": 63, "stabil": 61, "stabl": 15, "stable_baselines3": 65, "stack": [6, 13, 56], "stand": [16, 17, 18, 19, 20, 21], "standard": [12, 56, 63], "start": [12, 13, 58, 60, 61, 63, 65], "state": [2, 32, 42, 61, 63], "state_action_valu": 63, "state_to_cel": 61, "state_valu": 63, "statist": 4, "steadi": 61, "step": [2, 3, 5, 6, 7, 8, 9, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 60, 61, 63, 65], "step_data": [3, 5, 60, 61], "step_data_callback": [2, 60, 61], "step_data_kei": 5, "stepdata": [3, 5], "stepdatacallback": [2, 13, 56, 59, 62], "stitch": 15, "storag": [8, 12, 13, 56], "store": [2, 8, 10, 12, 13, 56, 60, 63], "str": [2, 5, 8, 9, 10, 11, 13, 58], "straight": [36, 37], "strictli": 63, "string": [11, 13, 58], "stronger": 61, "structur": [11, 12, 56], "style": [2, 10, 13, 56, 63], "sub": [14, 56], "subcomponent_1": 56, "subcomponent_2": 56, "subdirectori": 13, "subgroup": [56, 61], "subplot": 63, "subsequ": 56, "subset": [56, 59, 62], "subtask": [31, 32, 33, 34], "subtrajectori": [32, 34], "succ": 61, "success": [16, 17, 18, 19, 20, 21, 61, 65], "successfulli": [14, 60], "sudo": 63, "suggest": 56, "sum": 63, "sum_": 61, "summari": 63, "super": [5, 60, 61, 65], "support": [2, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 61, 63], "supportsfloat": 2, "suppos": 12, "sure": [14, 56], "surrog": 13, "switch": [31, 32, 33, 34], "sy": 65, "syntax": [2, 10, 13], "system": 61, "t": [2, 8, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 56, 58, 60, 61, 63], "tabl": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56], "tackl": 63, "take": [7, 13, 58, 61], "taken": [6, 8, 43, 44, 45, 46, 47, 48, 49, 50, 60], "tanh": 63, "tanh_loc": 63, "tanhnorm": 63, "target": [16, 17, 18, 19, 20, 21, 30, 31, 32, 33, 34, 42, 54, 61, 63], "target_net_updat": 63, "task": [10, 12, 15, 25, 29, 32, 34, 41, 43, 44, 45, 46, 47, 48, 49, 50, 54, 61, 63, 65], "tasks_to_complet": [31, 33, 34], "tau": [61, 63], "td": 63, "team": 11, "temperatur": 63, "templat": 56, "tempor": 63, "temporari": [2, 12, 56, 61], "tensor": [63, 65], "tensordict": 63, "tensordictmodul": 63, "termin": [2, 3, 5, 6, 7, 9, 12, 13, 16, 17, 18, 19, 20, 21, 42, 56, 58, 60, 61, 63, 65], "terminate_on_tasks_complet": [31, 33, 34], "test": [10, 11, 12, 15, 56, 60], "text": [13, 35, 36, 56, 61], "than": [10, 12, 16, 17, 18, 19, 20, 21, 56, 63], "thank": 56, "thei": [8, 13, 30, 56, 63], "them": [12, 13, 56, 65], "theme": 61, "theori": 61, "therefor": 63, "theta": 63, "thi": [1, 2, 4, 5, 6, 7, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 58, 60, 61, 63, 65], "thing": [56, 58], "think": 61, "thorough": 56, "those": 63, "thought": 56, "three": [25, 29, 41, 54, 61, 63], "through": [12, 13, 14, 55, 56, 61, 63], "thu": [42, 61], "tight_layout": 63, "time": [1, 2, 10, 61], "timestep": 56, "to_str": 58, "togeth": [10, 12, 14, 32, 33, 63], "tohsin": 56, "tomekst": 56, "tool": [14, 29, 56], "top": [13, 14, 31, 33, 34], "torch": [63, 65], "torchrl": [62, 66], "total": [7, 8, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 61, 63], "total_episod": [7, 8, 12, 13, 56, 65], "total_step": [7, 8, 12, 13, 56, 61], "total_timestep": 56, "touch": [11, 60], "toward": 61, "towardsdatasci": [15, 42, 61], "tqdm": [63, 65], "train": [15, 16, 17, 18, 19, 20, 21, 22, 25, 26, 29, 38, 41, 51, 54, 60], "trainer": 63, "trajectori": [14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 29, 39, 41, 42, 52, 54, 55, 56, 61], "transform": 63, "transformedenv": 63, "transit": [5, 56, 61, 63], "transition_matrix": 61, "tri": 63, "true": [2, 7, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 61, 63, 65], "truncat": [2, 3, 5, 6, 9, 12, 13, 42, 56, 58, 60, 61, 63, 65], "try": [58, 63], "tune": [14, 23, 25, 27, 29, 39, 41, 52, 54, 61, 63], "tupl": [2, 3, 13, 56, 61, 63], "tutori": [56, 58, 60, 61, 63, 65], "tutorials_jupyt": 62, "tutorials_python": 62, "two": [10, 12, 13, 14, 25, 29, 41, 42, 54, 56, 63, 65], "txt": 1, "type": [2, 12, 13, 25, 29, 41, 54, 56, 58, 63, 65], "typer": 14, "typic": 61, "typing_extens": 56, "typo": 56, "u": [14, 15, 20, 21, 42, 49, 50, 56, 63, 65], "uint8": [35, 36, 58, 63], "umaz": [15, 42, 56, 61], "under": [10, 13, 42, 56, 63], "undiscount": [10, 13], "unflatten": 56, "unifi": 56, "uniform": 61, "union": [7, 58], "uniqu": 58, "unknown": 56, "unless": 2, "unlik": 63, "until": [12, 43, 44, 45, 46, 47, 48, 49, 50], "up": [12, 16, 17, 18, 19, 20, 21, 56, 58, 60, 61, 63, 65], "updat": [2, 8, 12, 56, 61, 63], "update_dataset_from_buff": 7, "update_dataset_from_collector_env": 56, "update_episod": 8, "update_episode_metadata": 8, "update_from_storag": 8, "update_metadata": 8, "upgrad": 63, "upload": 56, "upload_namespac": 11, "upon": 15, "upper": 13, "us": [2, 7, 8, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 60, 61, 63, 65], "usag": [14, 56], "user": [2, 12, 13, 56], "usual": 63, "util": [10, 12, 55, 63, 65], "v": [2, 10, 13, 14, 32, 63], "v0": [10, 11, 12, 13, 35, 36, 37, 58, 60, 61, 65], "v1": [10, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 38, 39, 40, 41, 51, 52, 53, 54, 56, 63, 65], "v1_1": 65, "v2": [12, 13, 14, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 63], "v3": [42, 43, 44, 45, 46, 47, 48, 49, 50, 56, 60, 61], "v4": [15, 16, 17, 18, 19, 20, 21], "v_": [61, 63], "v_fn": 61, "valid": [10, 60, 61, 63], "valu": [2, 5, 6, 8, 9, 10, 12, 13, 44, 46, 48, 50, 56, 61, 63], "value_net": 63, "value_network": 63, "valueerror": 8, "valueoper": 63, "vari": [58, 63, 65], "variabl": [12, 13, 56, 61], "varianc": [43, 44, 45, 46, 47, 48, 49, 50, 61], "variat": 61, "varieti": 12, "variou": [32, 33, 58], "ve": 61, "vector_entry_point": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "veloc": [5, 42, 61], "veri": 12, "version": [2, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 60, 61], "via": [32, 63], "vicent": [43, 44, 45, 46, 47, 48, 49, 50, 61], "video": 63, "video_fold": 63, "viewer_env": 63, "virtual": 63, "virtual_displai": 63, "visibl": 63, "visual": 65, "visualis": 63, "vol": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "wa": [2, 7, 10, 13, 15, 25, 29, 35, 36, 37, 41, 54, 56, 58], "wai": [12, 61, 63], "wall": [42, 47, 48, 61], "want": [7, 12, 14, 61], "wapoint": 61, "warn": [14, 56, 63], "waypoint": [15, 16, 17, 18, 19, 20, 21, 42, 43, 44, 45, 46, 47, 48, 49, 50], "waypoint_control": 61, "waypoint_target": 61, "waypoint_threshold": 61, "waypointcontrol": 61, "wd": 56, "we": [12, 13, 30, 37, 56, 58, 60, 61, 63, 65], "weight": 63, "well": [12, 13, 14, 55, 56, 61, 63], "were": [10, 12, 14, 25, 29, 30, 32, 41, 42, 54, 56], "what": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 61], "when": [7, 12, 13, 16, 17, 18, 19, 20, 21, 42, 43, 44, 45, 46, 47, 48, 49, 50, 56, 58, 60, 61, 63], "where": [2, 8, 10, 13, 32, 34, 56, 61, 63], "whether": 11, "which": [2, 7, 8, 10, 12, 13, 15, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 60, 61, 63, 65], "while": [12, 56, 58, 60, 61, 63, 65], "who": 63, "whose": 63, "willdudlei": 56, "window": 56, "within": [7, 56, 63], "without": [43, 44, 45, 46, 47, 48, 49, 50, 56], "won": [12, 61], "work": [2, 12, 14, 56, 63], "workflow": 56, "world": 15, "worri": 58, "would": [11, 13, 14, 60, 61], "wrap": [2, 12, 56, 61, 63], "wrapper": [2, 4, 12, 13, 56, 58, 61, 63, 65], "write": [8, 63], "written": 63, "x": [7, 30, 42, 61, 65], "xvfb": 63, "xy": 61, "y": [14, 30, 42, 61, 63], "yml": 56, "you": [7, 8, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 60, 61, 63, 65], "youni": [35, 36], "younik": 56, "younis98": 36, "your": [12, 14, 56, 65], "zero": 61, "zero_grad": [63, 65], "zip": 62, "zoo": 65, "\u898b\u7fd2\u3044": 55}, "titles": ["404 - Page Not Found", "Minari documentation", "DataCollector", "EpisodeBuffer", "EpisodeMetadataCallback", "StepDataCallback", "EpisodeData", "MinariDataset", "MinariStorage", "StepData", "Minari", "Namespace", "Basic Usage", "Dataset Standards", "Minari CLI", "Ant Maze", "Large-Diverse", "Large-Play", "Medium-Diverse", "Medium-Play", "Umaze-Diverse", "Umaze", "Cloned", "Expert", "Human", "Door", "Cloned", "Expert", "Human", "Hammer", "D4RL", "Complete", "Kitchen", "Mixed", "Partial", "Fourrooms-Random", "Fourrooms", "MiniGrid", "Cloned", "Expert", "Human", "Pen", "Point Maze", "Large-Dense", "Large", "Medium-Dense", "Medium", "Open-Dense", "Open", "Umaze-Dense", "Umaze", "Cloned", "Expert", "Human", "Relocate", "<no title>", "Release Notes", "Dataset Creation", "Serializing a custom space", "Dataset Creation", "Collecting a subset of a dictionary space with StepDataCallback", "PointMaze D4RL dataset", "Tutorials", "Implicit Q-Learning with TorchRL", "Using Datasets", "Behavioral cloning with PyTorch", "Using Datasets"], "titleterms": {"0": 56, "1": [56, 61], "2": [56, 61], "3": [56, 61], "4": 56, "404": 0, "5": 56, "For": 63, "Not": 0, "The": [0, 63], "action": 13, "adroit": 63, "ant": 15, "attribut": [3, 6, 7, 8, 9], "basic": 12, "behavior": 65, "buffer": 63, "build": [1, 63], "checkpoint": 12, "cli": 14, "clone": [22, 26, 38, 51, 65], "collect": [12, 60, 61], "combin": [10, 12, 14], "complet": 31, "content": [15, 25, 29, 30, 32, 37, 41, 42, 54], "control": 61, "could": 0, "creat": [10, 11, 12, 61], "creation": [57, 59, 62], "custom": 58, "d": 61, "d4rl": [30, 61], "data": [12, 61], "data_collector": 3, "datacollector": 2, "dataset": [8, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 57, 59, 61, 62, 64, 65, 66], "defin": 63, "delet": [10, 11, 14], "dens": [43, 45, 47, 49], "deriv": 61, "descript": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "detail": 14, "dictionari": 60, "directori": 13, "divers": [16, 18, 20], "document": 1, "door": 25, "download": [10, 11, 12, 14], "environ": [12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 63], "episod": 12, "episodebuff": 3, "episodedata": [6, 13], "episodemetadatacallback": 4, "evalu": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "expert": [23, 27, 39, 52], "filter": 12, "found": 0, "fourroom": [35, 36], "gener": 65, "get": 11, "hammer": 29, "headless": 63, "human": [24, 28, 40, 53], "i": 61, "implicit": 63, "import": 65, "instal": 12, "integr": 61, "kitchen": 32, "larg": [16, 17, 43, 44], "learn": 63, "list": [10, 11, 14], "load": [10, 12], "local": [11, 12, 14], "loss": 63, "maze": [15, 42], "medium": [18, 19, 45, 46], "metadata": [11, 13], "method": [2, 3, 4, 5, 7, 8], "minari": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 61], "minari_storag": 8, "minaridataset": 7, "minaristorag": 8, "minigrid": 37, "mix": 33, "model": 63, "modifi": 61, "namespac": [11, 12, 13], "normal": 10, "note": 56, "observ": 13, "open": [47, 48], "optim": 63, "p": 61, "page": 0, "partial": 34, "pen": [41, 63], "plai": [17, 19], "planner": 61, "point": 42, "pointmaz": 61, "polici": 65, "pre": 63, "proport": 61, "pytorch": 65, "q": 63, "random": 35, "recov": 12, "refer": [15, 25, 29, 32, 37, 41, 42, 54, 61], "releas": 56, "reloc": 54, "replai": 63, "request": 0, "requisit": 63, "result": 63, "sampl": 12, "save": 12, "score": 10, "serial": 58, "show": 14, "space": [13, 58, 60], "spec": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "split": [10, 12], "standard": 13, "stepdata": 9, "stepdatacallback": [5, 60, 61], "structur": 13, "subset": 60, "support": 13, "term": 61, "torchrl": 63, "train": [63, 65], "tutori": 62, "umaz": [20, 21, 49, 50], "updat": 11, "upload": [11, 14], "us": [12, 62, 64, 66], "usag": 12, "v0": 56, "waypoint": 61}}) \ No newline at end of file +Search.setIndex({"alltitles": {"0.1.0": [[56, "release-0-1-0"]], "0.2.2": [[56, "release-0-2-2"]], "1. Proportional Term (P)": [[61, "proportional-term-p"]], "2. Derivative Term (D)": [[61, "derivative-term-d"]], "3. Integral Term (I)": [[61, "integral-term-i"]], "404 - Page Not Found": [[0, null]], "Ant Maze": [[15, null]], "Attributes": [[3, "attributes"], [6, "attributes"], [7, "attributes"], [8, "attributes"], [9, "attributes"]], "Basic Usage": [[12, null]], "Behavioral cloning with PyTorch": [[65, null], [65, "id1"]], "Build the Documentation": [[1, "build-the-documentation"]], "Building a replay buffer": [[63, "building-a-replay-buffer"]], "Checkpoint Minari Dataset": [[12, "checkpoint-minari-dataset"]], "Cloned": [[22, null], [26, null], [38, null], [51, null]], "Collect Data and Create Minari Dataset": [[61, "collect-data-and-create-minari-dataset"]], "Collecting Data": [[12, "collecting-data"]], "Collecting a subset of a dictionary space with StepDataCallback": [[60, null]], "Combine Minari Datasets": [[10, "combine-minari-datasets"], [12, "combine-minari-datasets"]], "Combine datasets": [[14, "combine-datasets"]], "Complete": [[31, null]], "Content": [[15, "content"], [25, "content"], [29, "content"], [30, "content"], [32, "content"], [37, "content"], [41, "content"], [42, "content"], [54, "content"]], "Create Minari Dataset": [[10, "create-minari-dataset"], [12, "create-minari-dataset"]], "Create Namespace": [[11, "create-namespace"]], "D4RL": [[30, null]], "DataCollector": [[2, null]], "Dataset Creation": [[57, null], [59, null], [62, "dataset-creation"]], "Dataset Metadata": [[13, "dataset-metadata"]], "Dataset Specs": [[16, "dataset-specs"], [17, "dataset-specs"], [18, "dataset-specs"], [19, "dataset-specs"], [20, "dataset-specs"], [21, "dataset-specs"], [22, "dataset-specs"], [23, "dataset-specs"], [24, "dataset-specs"], [26, "dataset-specs"], [27, "dataset-specs"], [28, "dataset-specs"], [31, "dataset-specs"], [33, "dataset-specs"], [34, "dataset-specs"], [35, "dataset-specs"], [36, "dataset-specs"], [38, "dataset-specs"], [39, "dataset-specs"], [40, "dataset-specs"], [43, "dataset-specs"], [44, "dataset-specs"], [45, "dataset-specs"], [46, "dataset-specs"], [47, "dataset-specs"], [48, "dataset-specs"], [49, "dataset-specs"], [50, "dataset-specs"], [51, "dataset-specs"], [52, "dataset-specs"], [53, "dataset-specs"]], "Dataset Standards": [[13, null]], "Dataset generation": [[65, "dataset-generation"]], "Defining the model": [[63, "defining-the-model"]], "Delete Minari Datasets": [[10, "delete-minari-datasets"]], "Delete Namespace": [[11, "delete-namespace"]], "Delete local datasets": [[14, "delete-local-datasets"]], "Description": [[16, "description"], [17, "description"], [18, "description"], [19, "description"], [20, "description"], [21, "description"], [22, "description"], [23, "description"], [24, "description"], [26, "description"], [27, "description"], [28, "description"], [31, "description"], [33, "description"], [34, "description"], [35, "description"], [36, "description"], [38, "description"], [39, "description"], [40, "description"], [43, "description"], [44, "description"], [45, "description"], [46, "description"], [47, "description"], [48, "description"], [49, "description"], [50, "description"], [51, "description"], [52, "description"], [53, "description"]], "Door": [[25, null]], "Download Datasets": [[12, "download-datasets"]], "Download Minari Dataset": [[10, "download-minari-dataset"]], "Download Namespace Metadata": [[11, "download-namespace-metadata"]], "Download datasets": [[14, "download-datasets"]], "Environment Specs": [[16, "environment-specs"], [17, "environment-specs"], [18, "environment-specs"], [19, "environment-specs"], [20, "environment-specs"], [21, "environment-specs"], [22, "environment-specs"], [23, "environment-specs"], [24, "environment-specs"], [26, "environment-specs"], [27, "environment-specs"], [28, "environment-specs"], [31, "environment-specs"], [33, "environment-specs"], [34, "environment-specs"], [35, "environment-specs"], [36, "environment-specs"], [38, "environment-specs"], [39, "environment-specs"], [40, "environment-specs"], [43, "environment-specs"], [44, "environment-specs"], [45, "environment-specs"], [46, "environment-specs"], [47, "environment-specs"], [48, "environment-specs"], [49, "environment-specs"], [50, "environment-specs"], [51, "environment-specs"], [52, "environment-specs"], [53, "environment-specs"]], "EpisodeBuffer": [[3, null]], "EpisodeData": [[6, null]], "EpisodeData Structure": [[13, "episodedata-structure"]], "EpisodeMetadataCallback": [[4, null]], "Evaluation Environment Specs": [[16, "evaluation-environment-specs"], [17, "evaluation-environment-specs"], [18, "evaluation-environment-specs"], [19, "evaluation-environment-specs"], [20, "evaluation-environment-specs"], [21, "evaluation-environment-specs"], [22, "evaluation-environment-specs"], [23, "evaluation-environment-specs"], [24, "evaluation-environment-specs"], [26, "evaluation-environment-specs"], [27, "evaluation-environment-specs"], [28, "evaluation-environment-specs"], [31, "evaluation-environment-specs"], [33, "evaluation-environment-specs"], [34, "evaluation-environment-specs"], [35, "evaluation-environment-specs"], [36, "evaluation-environment-specs"], [38, "evaluation-environment-specs"], [39, "evaluation-environment-specs"], [40, "evaluation-environment-specs"], [43, "evaluation-environment-specs"], [44, "evaluation-environment-specs"], [45, "evaluation-environment-specs"], [46, "evaluation-environment-specs"], [47, "evaluation-environment-specs"], [48, "evaluation-environment-specs"], [49, "evaluation-environment-specs"], [50, "evaluation-environment-specs"], [51, "evaluation-environment-specs"], [52, "evaluation-environment-specs"], [53, "evaluation-environment-specs"]], "Expert": [[23, null], [27, null], [39, null], [52, null]], "Filter Episodes": [[12, "filter-episodes"]], "For headless environments": [[63, "for-headless-environments"]], "Fourrooms": [[36, null]], "Fourrooms-Random": [[35, null]], "Get Local Namespace Metadata": [[11, "get-local-namespace-metadata"]], "Hammer": [[29, null]], "Human": [[24, null], [28, null], [40, null], [53, null]], "Implicit Q-Learning": [[63, "implicit-q-learning"]], "Implicit Q-Learning with TorchRL": [[63, null]], "Imports": [[65, "imports"]], "Installation": [[12, "installation"]], "Kitchen": [[32, null]], "Large": [[44, null]], "Large-Dense": [[43, null]], "Large-Diverse": [[16, null]], "Large-Play": [[17, null]], "List Minari Datasets": [[10, "list-minari-datasets"]], "List Namespaces": [[11, "list-namespaces"]], "List datasets": [[14, "list-datasets"]], "Load Local Datasets": [[12, "load-local-datasets"]], "Load Minari Dataset": [[10, "load-minari-dataset"]], "Loss and optimizer": [[63, "loss-and-optimizer"]], "Medium": [[46, null]], "Medium-Dense": [[45, null]], "Medium-Diverse": [[18, null]], "Medium-Play": [[19, null]], "Methods": [[2, "methods"], [3, "methods"], [4, "methods"], [5, "methods"], [7, "methods"], [8, "methods"]], "Minari": [[10, null]], "Minari CLI": [[14, null]], "Minari Dataset Directory": [[13, "minari-dataset-directory"]], "Minari documentation": [[1, null]], "MinariDataset": [[7, null]], "MinariStorage": [[8, null]], "MiniGrid": [[37, null]], "Mixed": [[33, null]], "Modified StepDataCallback": [[61, "modified-stepdatacallback"]], "Namespace": [[11, null]], "Namespace metadata": [[13, "namespace-metadata"]], "Normalize Score": [[10, "normalize-score"]], "Observation and Action Spaces": [[13, "observation-and-action-spaces"]], "Open": [[48, null]], "Open-Dense": [[47, null]], "Partial": [[34, null]], "Pen": [[41, null]], "Point Maze": [[42, null]], "PointMaze D4RL dataset": [[61, null]], "Policy training": [[65, "policy-training"]], "Pre-requisites": [[63, "pre-requisites"]], "Recover Environment": [[12, "recover-environment"]], "References": [[15, "references"], [25, "references"], [29, "references"], [32, "references"], [37, "references"], [41, "references"], [42, "references"], [54, "references"], [61, "references"]], "Release Notes": [[56, null]], "Relocate": [[54, null]], "Results": [[63, "results"]], "Sampling Episodes": [[12, "sampling-episodes"]], "Save Dataset": [[12, "save-dataset"]], "Serializing a custom space": [[58, null]], "Show datasets details": [[14, "show-datasets-details"]], "Split Dataset": [[12, "split-dataset"]], "Split Minari Dataset": [[10, "split-minari-dataset"]], "StepData": [[9, null]], "StepDataCallback": [[5, null]], "Supported Spaces": [[13, "supported-spaces"]], "The Adroit Pen environment": [[63, "the-adroit-pen-environment"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Training": [[63, "training"]], "Tutorials": [[62, null]], "Umaze": [[21, null], [50, null]], "Umaze-Dense": [[49, null]], "Umaze-Diverse": [[20, null]], "Update Namespace": [[11, "update-namespace"]], "Upload Namespace": [[11, "upload-namespace"]], "Upload datasets": [[14, "upload-datasets"]], "Using Datasets": [[62, "using-datasets"], [64, null], [66, null]], "Using Minari Datasets": [[12, "using-minari-datasets"]], "Using Namespaces": [[12, "using-namespaces"]], "WayPoint Planner": [[61, "waypoint-planner"]], "Waypoint Controller": [[61, "waypoint-controller"]], "minari.DataCollector": [[2, "minari-datacollector"]], "minari.EpisodeData": [[6, "minari-episodedata"]], "minari.EpisodeMetadataCallback": [[4, "minari-episodemetadatacallback"]], "minari.MinariDataset": [[7, "minari-minaridataset"]], "minari.StepData": [[9, "minari-stepdata"]], "minari.StepDataCallback": [[5, "minari-stepdatacallback"]], "minari.data_collector.EpisodeBuffer": [[3, "minari-data-collector-episodebuffer"]], "minari.dataset.minari_storage.MinariStorage": [[8, "minari-dataset-minari-storage-minaristorage"]], "v0.3.0": [[56, "release-v0-3-0"]], "v0.3.1": [[56, "release-v0-3-1"]], "v0.4.0": [[56, "release-v0-4-0"]], "v0.4.1": [[56, "release-v0-4-1"]], "v0.4.2": [[56, "release-v0-4-2"]], "v0.4.3": [[56, "release-v0-4-3"]], "v0.5.0": [[56, "release-v0-5-0"]], "v0.5.1": [[56, "release-v0-5-1"]]}, "docnames": ["404", "README", "api/data_collector", "api/data_collector/episode_buffer", "api/data_collector/episode_metadata_callback", "api/data_collector/step_data_callback", "api/minari_dataset/episode_data", "api/minari_dataset/minari_dataset", "api/minari_dataset/minari_storage", "api/minari_dataset/step_data", "api/minari_functions", "api/namespace/namespace", "content/basic_usage", "content/dataset_standards", "content/minari_cli", "datasets/D4RL/antmaze/index", "datasets/D4RL/antmaze/large-diverse-v1", "datasets/D4RL/antmaze/large-play-v1", "datasets/D4RL/antmaze/medium-diverse-v1", "datasets/D4RL/antmaze/medium-play-v1", "datasets/D4RL/antmaze/umaze-diverse-v1", "datasets/D4RL/antmaze/umaze-v1", "datasets/D4RL/door/cloned-v2", "datasets/D4RL/door/expert-v2", "datasets/D4RL/door/human-v2", "datasets/D4RL/door/index", "datasets/D4RL/hammer/cloned-v2", "datasets/D4RL/hammer/expert-v2", "datasets/D4RL/hammer/human-v2", "datasets/D4RL/hammer/index", "datasets/D4RL/index", "datasets/D4RL/kitchen/complete-v2", "datasets/D4RL/kitchen/index", "datasets/D4RL/kitchen/mixed-v2", "datasets/D4RL/kitchen/partial-v2", "datasets/D4RL/minigrid/fourrooms-random-v0", "datasets/D4RL/minigrid/fourrooms-v0", "datasets/D4RL/minigrid/index", "datasets/D4RL/pen/cloned-v2", "datasets/D4RL/pen/expert-v2", "datasets/D4RL/pen/human-v2", "datasets/D4RL/pen/index", "datasets/D4RL/pointmaze/index", "datasets/D4RL/pointmaze/large-dense-v2", "datasets/D4RL/pointmaze/large-v2", "datasets/D4RL/pointmaze/medium-dense-v2", "datasets/D4RL/pointmaze/medium-v2", "datasets/D4RL/pointmaze/open-dense-v2", "datasets/D4RL/pointmaze/open-v2", "datasets/D4RL/pointmaze/umaze-dense-v2", "datasets/D4RL/pointmaze/umaze-v2", "datasets/D4RL/relocate/cloned-v2", "datasets/D4RL/relocate/expert-v2", "datasets/D4RL/relocate/human-v2", "datasets/D4RL/relocate/index", "index", "release_notes/index", "tutorials/dataset_creation/README", "tutorials/dataset_creation/custom_space_serialization", "tutorials/dataset_creation/index", "tutorials/dataset_creation/observation_space_subseting", "tutorials/dataset_creation/point_maze_dataset", "tutorials/index", "tutorials/using_datasets/IQL_torchrl", "tutorials/using_datasets/README", "tutorials/using_datasets/behavioral_cloning", "tutorials/using_datasets/index"], "envversion": {"sphinx": 62, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1}, "filenames": ["404.md", "README.md", "api/data_collector.md", "api/data_collector/episode_buffer.md", "api/data_collector/episode_metadata_callback.md", "api/data_collector/step_data_callback.md", "api/minari_dataset/episode_data.md", "api/minari_dataset/minari_dataset.md", "api/minari_dataset/minari_storage.md", "api/minari_dataset/step_data.md", "api/minari_functions.md", "api/namespace/namespace.md", "content/basic_usage.md", "content/dataset_standards.md", "content/minari_cli.md", "datasets/D4RL/antmaze/index.md", "datasets/D4RL/antmaze/large-diverse-v1.md", "datasets/D4RL/antmaze/large-play-v1.md", "datasets/D4RL/antmaze/medium-diverse-v1.md", "datasets/D4RL/antmaze/medium-play-v1.md", "datasets/D4RL/antmaze/umaze-diverse-v1.md", "datasets/D4RL/antmaze/umaze-v1.md", "datasets/D4RL/door/cloned-v2.md", "datasets/D4RL/door/expert-v2.md", "datasets/D4RL/door/human-v2.md", "datasets/D4RL/door/index.md", "datasets/D4RL/hammer/cloned-v2.md", "datasets/D4RL/hammer/expert-v2.md", "datasets/D4RL/hammer/human-v2.md", "datasets/D4RL/hammer/index.md", "datasets/D4RL/index.md", "datasets/D4RL/kitchen/complete-v2.md", "datasets/D4RL/kitchen/index.md", "datasets/D4RL/kitchen/mixed-v2.md", "datasets/D4RL/kitchen/partial-v2.md", "datasets/D4RL/minigrid/fourrooms-random-v0.md", "datasets/D4RL/minigrid/fourrooms-v0.md", "datasets/D4RL/minigrid/index.md", "datasets/D4RL/pen/cloned-v2.md", "datasets/D4RL/pen/expert-v2.md", "datasets/D4RL/pen/human-v2.md", "datasets/D4RL/pen/index.md", "datasets/D4RL/pointmaze/index.md", "datasets/D4RL/pointmaze/large-dense-v2.md", "datasets/D4RL/pointmaze/large-v2.md", "datasets/D4RL/pointmaze/medium-dense-v2.md", "datasets/D4RL/pointmaze/medium-v2.md", "datasets/D4RL/pointmaze/open-dense-v2.md", "datasets/D4RL/pointmaze/open-v2.md", "datasets/D4RL/pointmaze/umaze-dense-v2.md", "datasets/D4RL/pointmaze/umaze-v2.md", "datasets/D4RL/relocate/cloned-v2.md", "datasets/D4RL/relocate/expert-v2.md", "datasets/D4RL/relocate/human-v2.md", "datasets/D4RL/relocate/index.md", "index.md", "release_notes/index.md", "tutorials/dataset_creation/README.rst", "tutorials/dataset_creation/custom_space_serialization.rst", "tutorials/dataset_creation/index.rst", "tutorials/dataset_creation/observation_space_subseting.rst", "tutorials/dataset_creation/point_maze_dataset.rst", "tutorials/index.rst", "tutorials/using_datasets/IQL_torchrl.rst", "tutorials/using_datasets/README.rst", "tutorials/using_datasets/behavioral_cloning.rst", "tutorials/using_datasets/index.rst"], "indexentries": {"__call__() (in module minari.episodemetadatacallback)": [[4, "minari.EpisodeMetadataCallback.__call__", false]], "__call__() (in module minari.stepdatacallback)": [[5, "minari.StepDataCallback.__call__", false]], "__len__() (in module minari.data_collector.episodebuffer)": [[3, "minari.data_collector.EpisodeBuffer.__len__", false]], "action (minari.stepdata attribute)": [[9, "minari.StepData.action", false]], "action_space (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.action_space", false]], "actions (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.actions", false]], "actions (minari.episodedata attribute)": [[6, "minari.EpisodeData.actions", false]], "add_step_data() (in module minari.data_collector.episodebuffer)": [[3, "minari.data_collector.EpisodeBuffer.add_step_data", false]], "add_to_dataset() (in module minari.datacollector)": [[2, "minari.DataCollector.add_to_dataset", false]], "apply() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.apply", false]], "close() (in module minari.datacollector)": [[2, "minari.DataCollector.close", false]], "combine_datasets() (in module minari)": [[10, "minari.combine_datasets", false]], "create_dataset() (in module minari.datacollector)": [[2, "minari.DataCollector.create_dataset", false]], "create_dataset_from_buffers() (in module minari)": [[10, "minari.create_dataset_from_buffers", false]], "create_namespace() (in module minari.namespace)": [[11, "minari.namespace.create_namespace", false]], "data_path (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.data_path", false]], "datacollector (class in minari)": [[2, "minari.DataCollector", false]], "delete_dataset() (in module minari)": [[10, "minari.delete_dataset", false]], "delete_namespace() (in module minari.namespace)": [[11, "minari.namespace.delete_namespace", false]], "download_dataset() (in module minari)": [[10, "minari.download_dataset", false]], "download_namespace_metadata() (in module minari.namespace)": [[11, "minari.namespace.download_namespace_metadata", false]], "episode_indices (minari.minaridataset attribute)": [[7, "minari.MinariDataset.episode_indices", false]], "episodebuffer (class in minari.data_collector)": [[3, "minari.data_collector.EpisodeBuffer", false]], "episodedata (class in minari)": [[6, "minari.EpisodeData", false]], "episodemetadatacallback (class in minari)": [[4, "minari.EpisodeMetadataCallback", false]], "filter_episodes() (in module minari.minaridataset)": [[7, "minari.MinariDataset.filter_episodes", false]], "get_episode_metadata() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.get_episode_metadata", false]], "get_episodes() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.get_episodes", false]], "get_namespace_metadata() (in module minari.namespace)": [[11, "minari.namespace.get_namespace_metadata", false]], "get_normalized_score() (in module minari)": [[10, "minari.get_normalized_score", false]], "get_size() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.get_size", false]], "id (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.id", false]], "id (minari.episodedata attribute)": [[6, "minari.EpisodeData.id", false]], "info (minari.stepdata attribute)": [[9, "minari.StepData.info", false]], "infos (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.infos", false]], "infos (minari.episodedata attribute)": [[6, "minari.EpisodeData.infos", false]], "iterate_episodes() (in module minari.minaridataset)": [[7, "minari.MinariDataset.iterate_episodes", false]], "list_local_datasets() (in module minari)": [[10, "minari.list_local_datasets", false]], "list_local_namespaces() (in module minari.namespace)": [[11, "minari.namespace.list_local_namespaces", false]], "list_remote_datasets() (in module minari)": [[10, "minari.list_remote_datasets", false]], "list_remote_namespaces() (in module minari.namespace)": [[11, "minari.namespace.list_remote_namespaces", false]], "load_dataset() (in module minari)": [[10, "minari.load_dataset", false]], "metadata (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.metadata", false]], "minaridataset (class in minari)": [[7, "minari.MinariDataset", false]], "minaristorage (class in minari.dataset.minari_storage)": [[8, "minari.dataset.minari_storage.MinariStorage", false]], "new() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.new", false]], "observation (minari.stepdata attribute)": [[9, "minari.StepData.observation", false]], "observation_space (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.observation_space", false]], "observations (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.observations", false]], "observations (minari.episodedata attribute)": [[6, "minari.EpisodeData.observations", false]], "read() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.read", false]], "recover_environment() (in module minari.minaridataset)": [[7, "minari.MinariDataset.recover_environment", false]], "reset() (in module minari.datacollector)": [[2, "minari.DataCollector.reset", false]], "rewards (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.rewards", false]], "sample_episodes() (in module minari.minaridataset)": [[7, "minari.MinariDataset.sample_episodes", false]], "seed (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.seed", false]], "set_seed() (in module minari.minaridataset)": [[7, "minari.MinariDataset.set_seed", false]], "spec (minari.minaridataset attribute)": [[7, "minari.MinariDataset.spec", false]], "split_dataset() (in module minari)": [[10, "minari.split_dataset", false]], "step() (in module minari.datacollector)": [[2, "minari.DataCollector.step", false]], "stepdata (class in minari)": [[9, "minari.StepData", false]], "stepdatacallback (class in minari)": [[5, "minari.StepDataCallback", false]], "termination (minari.stepdata attribute)": [[9, "minari.StepData.termination", false]], "terminations (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.terminations", false]], "terminations (minari.episodedata attribute)": [[6, "minari.EpisodeData.terminations", false]], "total_episodes (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.total_episodes", false]], "total_episodes (minari.minaridataset attribute)": [[7, "minari.MinariDataset.total_episodes", false]], "total_steps (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.total_steps", false]], "total_steps (minari.minaridataset attribute)": [[7, "minari.MinariDataset.total_steps", false]], "truncation (minari.stepdata attribute)": [[9, "minari.StepData.truncation", false]], "truncations (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.truncations", false]], "truncations (minari.episodedata attribute)": [[6, "minari.EpisodeData.truncations", false]], "update_dataset_from_buffer() (in module minari.minaridataset)": [[7, "minari.MinariDataset.update_dataset_from_buffer", false]], "update_episode_metadata() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_episode_metadata", false]], "update_episodes() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_episodes", false]], "update_from_storage() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_from_storage", false]], "update_metadata() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_metadata", false]], "upload_namespace() (in module minari.namespace)": [[11, "minari.namespace.upload_namespace", false]]}, "objects": {"minari": [[2, 0, 1, "", "DataCollector"], [6, 0, 1, "", "EpisodeData"], [4, 0, 1, "", "EpisodeMetadataCallback"], [7, 0, 1, "", "MinariDataset"], [9, 0, 1, "", "StepData"], [5, 0, 1, "", "StepDataCallback"], [10, 1, 1, "", "combine_datasets"], [10, 1, 1, "", "create_dataset_from_buffers"], [10, 1, 1, "", "delete_dataset"], [10, 1, 1, "", "download_dataset"], [10, 1, 1, "", "get_normalized_score"], [10, 1, 1, "", "list_local_datasets"], [10, 1, 1, "", "list_remote_datasets"], [10, 1, 1, "", "load_dataset"], [10, 1, 1, "", "split_dataset"]], "minari.DataCollector": [[2, 1, 1, "", "add_to_dataset"], [2, 1, 1, "", "close"], [2, 1, 1, "", "create_dataset"], [2, 1, 1, "", "reset"], [2, 1, 1, "", "step"]], "minari.EpisodeData": [[6, 2, 1, "", "actions"], [6, 2, 1, "", "id"], [6, 2, 1, "", "infos"], [6, 2, 1, "", "observations"], [6, 2, 1, "", "terminations"], [6, 2, 1, "", "truncations"]], "minari.EpisodeMetadataCallback": [[4, 1, 1, "", "__call__"]], "minari.MinariDataset": [[7, 2, 1, "", "episode_indices"], [7, 1, 1, "", "filter_episodes"], [7, 1, 1, "", "iterate_episodes"], [7, 1, 1, "", "recover_environment"], [7, 1, 1, "", "sample_episodes"], [7, 1, 1, "", "set_seed"], [7, 2, 1, "", "spec"], [7, 2, 1, "", "total_episodes"], [7, 2, 1, "", "total_steps"], [7, 1, 1, "", "update_dataset_from_buffer"]], "minari.StepData": [[9, 2, 1, "", "action"], [9, 2, 1, "", "info"], [9, 2, 1, "", "observation"], [9, 2, 1, "", "termination"], [9, 2, 1, "", "truncation"]], "minari.StepDataCallback": [[5, 1, 1, "", "__call__"]], "minari.data_collector": [[3, 0, 1, "", "EpisodeBuffer"]], "minari.data_collector.EpisodeBuffer": [[3, 1, 1, "", "__len__"], [3, 2, 1, "", "actions"], [3, 1, 1, "", "add_step_data"], [3, 2, 1, "", "id"], [3, 2, 1, "", "infos"], [3, 2, 1, "", "observations"], [3, 2, 1, "", "rewards"], [3, 2, 1, "", "seed"], [3, 2, 1, "", "terminations"], [3, 2, 1, "", "truncations"]], "minari.dataset.minari_storage": [[8, 0, 1, "", "MinariStorage"]], "minari.dataset.minari_storage.MinariStorage": [[8, 2, 1, "", "action_space"], [8, 1, 1, "", "apply"], [8, 2, 1, "", "data_path"], [8, 1, 1, "", "get_episode_metadata"], [8, 1, 1, "", "get_episodes"], [8, 1, 1, "", "get_size"], [8, 2, 1, "", "metadata"], [8, 1, 1, "", "new"], [8, 2, 1, "", "observation_space"], [8, 1, 1, "", "read"], [8, 2, 1, "", "total_episodes"], [8, 2, 1, "", "total_steps"], [8, 1, 1, "", "update_episode_metadata"], [8, 1, 1, "", "update_episodes"], [8, 1, 1, "", "update_from_storage"], [8, 1, 1, "", "update_metadata"]], "minari.namespace": [[11, 1, 1, "", "create_namespace"], [11, 1, 1, "", "delete_namespace"], [11, 1, 1, "", "download_namespace_metadata"], [11, 1, 1, "", "get_namespace_metadata"], [11, 1, 1, "", "list_local_namespaces"], [11, 1, 1, "", "list_remote_namespaces"], [11, 1, 1, "", "upload_namespace"]]}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "function", "Python function"], "2": ["py", "attribute", "Python attribute"]}, "objtypes": {"0": "py:class", "1": "py:function", "2": "py:attribute"}, "terms": {"": [2, 4, 5, 10, 12, 13, 14, 16, 17, 18, 19, 20, 32, 56, 58, 60, 61, 63, 65], "0": [2, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 58, 60, 61, 63, 65], "000": [61, 63], "0003": 63, "005": 63, "01": 56, "0123456789abcdefghijklmnopqrstuvwxyzabcdeeeffghijklmnnoopqrrssttuvwxyzz": [35, 36], "03ac13": [14, 55], "04": 56, "05": 56, "07": 56, "07219": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "08": 56, "09": 56, "0x11f2608b0": 58, "0x12253a940": 58, "0x7f81d3e221f0": [35, 36], "1": [2, 7, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 63, 65], "10": [12, 13, 56, 58, 60, 61, 63], "100": [2, 10, 12, 14, 38, 39, 40, 55, 56, 63], "1000": [12, 16, 17, 18, 19, 56, 63], "1000000": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 26, 27, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55], "1000070": 35, "10010": 36, "1006729": 12, "10087": [25, 29, 41, 54], "101": 56, "10174": 35, "102": 56, "104": 56, "105": 56, "107": 56, "1077": [14, 55], "108": 56, "109": 56, "1096": [12, 14, 55], "10_000": [61, 63], "11": 56, "110": 56, "1103": 12, "111": 56, "112": 56, "11310": 28, "116": 56, "11956": 32, "12": [12, 56, 63], "121": 56, "123": [12, 56, 61], "124": 56, "126": 56, "128": [56, 63, 65], "129": 56, "13": [12, 56], "130": 56, "132": 56, "13210": [49, 50], "133": 56, "137": 56, "139": 56, "14": [35, 36, 56], "1400": 63, "1430": [20, 21], "144": 56, "148": 56, "15": 12, "151": 56, "153": 56, "155": 56, "156560": [33, 34], "157": 56, "158": 56, "160": 56, "161": 56, "162": 56, "163": 56, "164": 56, "165": 56, "167": 56, "169": 56, "16x16": 58, "17": [12, 56], "170": 56, "1709": [25, 29, 41, 54], "171": 56, "172": 56, "177": 56, "18": [12, 56], "183": 56, "1872": 63, "19": [12, 31, 56], "1910": 32, "196": 56, "1_000": [63, 65], "1e": 61, "1f": 63, "2": [2, 10, 12, 15, 16, 17, 18, 19, 20, 21, 25, 29, 30, 31, 32, 33, 34, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 58, 60, 63], "20": [12, 56, 63], "200": [22, 23, 24, 26, 27, 28, 51, 52, 53], "2004": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "2017": [25, 29, 41, 54], "2019": 32, "2020": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "2021": [15, 63], "2022": 56, "2023": [56, 63], "2024": 56, "2059": 12, "21": 12, "211": 56, "218": 56, "22": [12, 15, 56], "224": 56, "23": 12, "239": 56, "24": [14, 25, 29, 38, 39, 40, 41, 54, 63], "240": 56, "241": 56, "244": 56, "245": 56, "25": [12, 14, 24, 25, 28, 29, 40, 41, 53, 54, 55, 56, 63], "255": [35, 36, 58], "256": [63, 65], "26": [26, 27, 28, 56], "268": 15, "27": [16, 17, 18, 19, 20, 21, 56], "28": [12, 22, 23, 24, 56], "280": 31, "29": 56, "2d": [15, 30], "2f": 63, "3": [2, 10, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 58, 63], "30": [51, 52, 53, 63], "300": [47, 48, 49, 50], "305": 56, "31": 56, "32": 65, "3360": [43, 44], "34": 56, "3606": 26, "3736": [14, 38], "3758": 51, "39": [12, 22, 23, 24, 51, 52, 53], "4": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 60, 61], "42": [58, 60, 63, 65], "4209": 31, "4356": [14, 55], "4358": 22, "45": [14, 38, 39, 40, 63], "450": [33, 34], "46": [26, 27, 28], "4752": [45, 46], "480": 63, "4958": [14, 39], "499206": [14, 39], "5": [12, 14, 61, 63], "50": [22, 25, 26, 29, 38, 41, 51, 54, 61, 63], "500": 65, "5000": [12, 14, 23, 27, 40, 52, 55, 63], "500000": [14, 38], "5025": 12, "50_000": 63, "52": 56, "54": 56, "55": 56, "57": 56, "59": [31, 33, 34], "590": 36, "6": [12, 56], "60": 56, "600": [45, 46], "604": 14, "605": 12, "621": [33, 34], "638": 14, "6729": [12, 14, 24, 55], "69": 63, "7": [12, 14, 31, 33, 34, 35, 36, 55, 56, 58, 63], "700": [20, 21], "71": 56, "73": 56, "75": 56, "77": 56, "8": [12, 15, 16, 17, 18, 19, 20, 21, 30, 42, 56, 61], "80": [16, 17, 18, 19, 56], "800": [43, 44], "82": 56, "83": 56, "84": 56, "86": 56, "87": 56, "88": 56, "884": 63, "9": [12, 31, 33, 34], "90": [20, 21, 56], "900": 63, "92": 56, "93": 56, "95": 56, "9525": [47, 48], "96": 56, "99": [56, 61, 63], "9942": 53, "A": [2, 8, 13, 32, 55, 61, 63], "And": 65, "As": [6, 13, 56, 61, 65], "At": [16, 17, 18, 19, 20], "But": [58, 63], "By": [61, 63], "For": [1, 2, 10, 11, 12, 13, 30, 56, 58, 61, 65], "If": [2, 7, 8, 10, 11, 12, 13, 14, 56, 58, 61, 63], "In": [12, 13, 56, 58, 60, 61, 63, 65], "It": [56, 61, 63], "No": 58, "Not": [14, 22, 23, 24, 26, 27, 28, 38, 39, 40, 51, 52, 53], "On": [13, 61, 63], "The": [2, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 60, 61, 65], "Then": [58, 61, 63], "There": [12, 25, 29, 41, 54, 63], "These": [10, 14, 25, 29, 30, 32, 41, 42, 54, 56, 61], "To": [1, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 63, 65], "With": 14, "_": [2, 12, 58, 60, 61, 63, 65], "_0": 61, "__call__": [4, 5, 60, 61], "__init__": [61, 65], "__len__": 3, "_build": 1, "_check_valid_cel": 61, "_gen_miss": [35, 36, 58], "_index_0": 56, "_index_1": 56, "_max": 10, "_min": 10, "_score": 10, "_script": 56, "a1efe4": [14, 55], "a256f8": 14, "a5a5a1": 14, "a_hat": 65, "a_pr": 65, "a_t": 63, "ab": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "abil": 12, "abl": [12, 42], "abort": 14, "about": [1, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58], "abov": [12, 56, 58, 60, 63], "abspath": 65, "abstract": 12, "ac": 65, "access": [8, 12, 14, 56, 61], "account": 61, "accumul": [16, 17, 18, 19, 20, 21, 61, 65], "accumulated_rew": 65, "accur": 63, "achiev": [12, 61, 65], "achieved_go": [16, 17, 18, 19, 20, 21, 31, 33, 34, 43, 44, 45, 46, 47, 48, 49, 50, 60, 61], "achieved_goal_cel": 61, "acrobot": 12, "across": [10, 13, 56], "act": 56, "action": [2, 3, 5, 6, 8, 9, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 37, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 60, 61, 63, 65], "action_id": 61, "action_idx": 61, "action_spac": [2, 8, 10, 12, 13, 56, 58, 60, 61, 65], "action_space_subset": 60, "action_spec": 63, "activ": [15, 63], "activation_class": 63, "activation_fn": 63, "actor": 63, "actor_extractor": 63, "actor_mlp": 63, "actor_modul": 63, "actor_net": 63, "acttyp": [2, 10], "actual": 61, "actuat": [30, 42], "ad": [5, 7, 8, 10, 12, 13, 43, 44, 45, 46, 47, 48, 49, 50, 56, 60], "adam": [15, 63, 65], "add": [2, 3, 4, 5, 7, 8, 14, 43, 44, 45, 46, 47, 48, 49, 50, 56, 61, 63], "add_step_data": 3, "add_to_dataset": [2, 12], "addit": [2, 5, 7, 11, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56], "addition": [15, 56], "additional_dataset": 56, "additional_group": 56, "additional_wrapp": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "address": 61, "adher": 56, "adjust": 61, "adroit_door": [22, 23, 24], "adroit_h": 14, "adroit_hamm": [26, 27, 28], "adroit_hand": [14, 22, 23, 24, 26, 27, 28, 38, 39, 40, 51, 52, 53], "adroit_pen": [14, 38, 39, 40], "adroit_reloc": [51, 52, 53], "adroithanddoor": [12, 13, 22, 23, 24, 25, 30, 56], "adroithanddoorenv": [22, 23, 24], "adroithandhamm": [26, 27, 28, 29, 30, 56], "adroithandhammerenv": [26, 27, 28], "adroithandpen": [14, 30, 38, 39, 40, 41, 56, 63], "adroithandpenenv": [38, 39, 40], "adroithandreloc": [30, 51, 52, 53, 54, 56], "adroithandrelocateenv": [51, 52, 53], "advantag": [61, 63], "after": [2, 4, 6, 9, 10, 13, 14, 56, 61, 65], "again": [16, 17, 18, 19, 20, 21], "agent": [9, 15, 16, 17, 18, 19, 20, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 60, 61, 63, 65], "aggress": 61, "agnost": [2, 63], "aim": [13, 61, 63], "al": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61, 63], "alex": [12, 16, 17, 18, 19, 20, 21], "alexdavei": 56, "alexdavey0": [16, 17, 18, 19, 20, 21], "algo": 65, "algorithm": [2, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 63], "algorithm_nam": [2, 10, 12, 13, 58, 60, 61, 65], "all": [8, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 30, 31, 32, 55, 56, 58, 62, 63, 65], "allow": [12, 13, 56, 61, 65], "alon": 61, "along": [30, 42], "alreadi": [8, 12, 14, 56, 60, 61, 63], "also": [10, 12, 14, 16, 17, 18, 19, 20, 21, 55, 56, 58, 60, 61, 63], "alwai": 61, "among": 56, "amount": [12, 61], "amp": 56, "an": [4, 7, 10, 11, 12, 13, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 47, 48, 51, 52, 53, 54, 56, 58, 61, 63], "ani": [2, 5, 6, 7, 8, 9, 10, 11, 12, 56, 60, 61], "annot": 56, "anoth": [2, 5, 8, 12, 13, 25, 29, 41, 54, 61, 63], "anssi": 15, "ant": [16, 17, 18, 19, 20, 21, 30], "ant_maze_v4": [16, 17, 18, 19, 20, 21], "antmaz": [12, 16, 17, 18, 19, 20, 21], "antmaze_larg": [15, 17], "antmaze_large_diverse_gr": [15, 16], "antmaze_medium": [15, 19], "antmaze_medium_diverse_gr": [15, 18], "antmaze_umaz": [15, 20, 21], "antmazeenv": [16, 17, 18, 19, 20, 21], "antonin": 15, "apart": 56, "api": [11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 61, 65], "appear": [12, 56], "append": [3, 8, 12, 56, 63], "appli": [8, 58], "applic": [12, 56], "appreci": 56, "approach": 61, "appropri": 13, "approx": 63, "approxim": 63, "apr": [15, 42, 61], "apt": 63, "ar": [2, 6, 8, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 51, 52, 53, 54, 55, 56, 58, 61, 63], "arang": 63, "aravind": [25, 29, 41, 54], "aravindr93": 14, "arbitrari": [13, 56], "arbitrarili": 13, "arena": [42, 47, 48], "arg": [14, 56, 61, 63], "argmax": [61, 65], "argument": [4, 5, 10, 12, 13, 56], "argv": 65, "around": [58, 63], "arrai": [10, 61], "arrow": [13, 56], "arxiv": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "as_tensor": 65, "ashlei": 15, "assert": [22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 58, 65], "assign": 10, "associ": 13, "attach": 13, "attempt": 63, "attr": 56, "attribut": [2, 4, 10, 12, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 56], "author": [2, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 61, 65], "author_email": [2, 10, 12, 13, 56, 58, 61, 65], "auto": [63, 65], "auto_cast_to_devic": 63, "autobuild": 1, "automat": [1, 2, 13, 56], "autoreset": 14, "auxiliari": 2, "avail": [7, 10, 12, 14, 55, 56, 58, 63], "averag": [2, 10, 63], "avg": 63, "avjmachin": 56, "avoid": [56, 63], "awai": 56, "ax": 63, "axi": [30, 42, 61, 63], "b": [1, 14, 55], "b64encod": 63, "back": [58, 61], "background": 56, "backpropag": 63, "backward": [63, 65], "badg": 56, "balanc": 65, "balisujohn": 56, "ball": [15, 30, 42, 54, 61], "bamboofungu": 56, "bar": 14, "base": [12, 14, 56, 61, 63], "base64": 63, "base_env": 63, "baselin": 15, "baselines3": [15, 65], "basi": 56, "basic": [56, 63], "batch": [63, 65], "batch_first": 65, "batch_siz": [63, 65], "becaus": [15, 16, 17, 18, 19, 20, 21, 42, 63], "been": [12, 42, 56], "befor": [2, 12, 58, 61, 63], "begin": [16, 17, 18, 19, 20, 65], "behav": 63, "behavior": [56, 61, 62, 63, 66], "behavioral_clon": 65, "behaviour": 63, "being": [2, 10, 13, 31, 32, 33, 34, 42, 43, 45, 47, 49], "bellman": 61, "bellow": 56, "belong": 5, "below": [14, 61, 63], "benchmark": [30, 63], "best": 63, "best_model": 65, "beta": [56, 63], "between": [10, 43, 45, 47, 49, 61], "bias": 61, "bind": 61, "bit": [61, 63], "black": 56, "blob": [58, 61], "block": 63, "blue": 63, "board": 29, "bool": [2, 5, 7, 9, 10, 11, 56, 63], "boolean": 10, "both": [8, 13, 14, 58, 60], "bottom": [31, 33, 34], "bound": [13, 61, 63], "box": [12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 60, 65], "break": [12, 56, 61, 65], "bucket": [12, 13, 55, 56], "buffer": [2, 3, 7, 8, 10, 12, 56], "bug": 56, "bugfix": 56, "build": [14, 56], "burner": [31, 33, 34], "c": [12, 16, 18, 32, 56], "cabinet": [31, 32, 33, 34], "cach": [2, 12, 56, 63], "calcul": [10, 63], "call": [2, 5, 12, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 56], "callabl": [2, 7, 8, 10, 12, 56, 58], "callback": [2, 4, 5, 56, 60, 61], "can": [2, 4, 5, 7, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 60, 61, 63, 65], "capabl": 12, "captur": 63, "care": 58, "cart": 65, "cartpol": [11, 12, 56, 65], "case": [12, 56, 61], "cd": [1, 12], "cell": [16, 18, 61], "cell_rowcol_to_xi": 61, "cell_to_st": 61, "cell_xy_to_rowcol": 61, "center": 14, "certain": [7, 12, 41], "cff": 56, "challeng": [15, 63], "chang": [1, 11, 56, 61], "changelog": 56, "characterist": [2, 61], "charg": 56, "charset": [13, 35, 36], "check": [12, 14, 56, 61], "checkpoint": 56, "choic": 63, "choos": [13, 58, 60], "chosen": 61, "ci": 56, "citat": 56, "class": [2, 3, 4, 5, 6, 7, 8, 9, 13, 56, 60, 61, 63, 65], "classic": [12, 61, 65], "classic_control": 12, "classif": 65, "clean": 58, "clear": 2, "clear_episode_buff": 56, "cli": [55, 56], "clip": 61, "clone": [1, 12, 14, 25, 29, 41, 54, 55, 56, 62, 63, 66], "close": [2, 32, 61, 63, 65], "cloud": [12, 13, 56], "cmmcirvin": 56, "code": [2, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 60, 61, 62, 63, 65], "code_permalink": [2, 10, 12, 13, 58, 61, 65], "codelink": 56, "colab": 63, "collate_fn": 65, "collect": [2, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 59, 62, 63], "collector": [2, 61], "collector_env": [56, 61], "collis": 61, "color": [14, 55], "com": [1, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 61], "combin": [56, 61], "combine_dataset": [10, 12, 56], "combined_dataset": 10, "come": [13, 14], "command": [12, 14, 56, 65], "commit": 56, "common": [12, 13], "compar": [6, 60], "comparison": 10, "compat": [10, 12, 14, 56, 65], "compatible_minari_vers": 10, "complement": 2, "complet": [32, 33, 34, 56, 63], "complex": [15, 25, 29, 30, 41, 54, 56], "compli": 56, "compliant": [13, 56], "compon": 61, "component_1": 56, "component_2": 56, "compris": 12, "comput": [2, 10, 12, 13, 63], "compute_act": 61, "compute_reward_matrix": 61, "compute_transition_matrix": 61, "concaten": 63, "condit": [7, 12, 56, 63], "configur": [32, 56, 63], "confirm": [14, 63], "conflict": 63, "conjunct": 63, "consid": [8, 56, 61, 63], "consider": 56, "consist": [13, 42, 63], "constantli": 56, "construct": 61, "contact": [11, 12, 58, 65], "contain": [1, 2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 42, 47, 48, 49, 50, 51, 52, 53, 56], "content": [13, 14], "continu": [10, 12, 13, 42, 43, 44, 45, 46, 47, 48, 49, 50, 61], "continuing_task": [16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 61], "contribut": [1, 12, 56, 61], "contributor": 56, "control": [12, 15, 42, 43, 44, 45, 46, 47, 48, 49, 50, 56, 63, 65], "conveni": 63, "convent": 56, "convers": [56, 58], "convert": [2, 61, 63], "coordin": 61, "copi": [56, 63], "core": 58, "corl": 63, "corr": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "correct": [56, 61, 63], "correspond": [2, 10, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 61, 65], "could": [15, 63], "cover": 63, "coverag": 56, "cpu": 63, "creat": [2, 5, 7, 8, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 56, 58, 60, 63, 65], "create_dataset": [2, 12, 56, 58, 60, 61, 65], "create_dataset_from_buff": [10, 12, 13, 56], "create_dataset_from_collector_env": 56, "create_namespac": 11, "creation": [2, 12, 13, 56], "credenti": 11, "cross": 65, "crossentropyloss": 65, "cuda": 63, "cumul": [61, 63], "curat": 56, "current": [5, 10, 12, 13, 14, 56, 61, 63], "current_cel": 61, "current_control_target_id": 61, "current_control_target_xi": 61, "current_st": 61, "custom": [2, 4, 12, 56, 59, 61, 62], "custom_space_seri": 58, "customstepdatacallback": 5, "customsubsetstepdatacallback": 60, "cython": 56, "d": [12, 63], "d4rl": [10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 59, 62, 63], "da": 61, "dampen": 61, "dapg": [14, 23, 24, 25, 27, 28, 29, 39, 40, 41, 52, 53, 54], "data": [2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 29, 30, 32, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 58, 63, 65], "data_collector": 60, "data_format": [2, 8, 10, 56], "data_path": 8, "data_url": 63, "databas": [10, 11, 14], "databefor": 2, "dataclass": [8, 56], "datacollector": [4, 12, 13, 56, 58, 60, 61, 65], "datacollectorv0": 56, "dataload": [12, 56, 65], "datas": 8, "dataset": [2, 4, 5, 6, 7, 11, 15, 25, 29, 30, 32, 37, 41, 42, 54, 55, 56, 58, 60, 63], "dataset_cr": [56, 58, 61], "dataset_id": [2, 10, 11, 12, 13, 56, 58, 60, 61, 63, 65], "dataset_nam": [2, 10, 13, 14, 61], "dataset_s": 56, "dataset_v1": 56, "dataset_v2": 56, "dataset_v3": 56, "datasets_to_combin": [10, 56], "davei": [12, 16, 17, 18, 19, 20, 21], "de": [12, 14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 51, 52, 53], "decent": 63, "decod": 63, "deep": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "def": [5, 58, 60, 61, 63, 65], "default": [2, 5, 7, 8, 10, 11, 12, 13, 63], "default_interaction_typ": 63, "defin": [13, 58, 60, 65], "definit": 56, "del": [58, 60], "deleg": 56, "delet": [58, 60], "delete_dataset": [10, 58, 60], "delete_namespac": 11, "demonstr": [22, 24, 25, 26, 28, 29, 31, 32, 38, 40, 41, 51, 53, 54, 63], "dens": [14, 22, 23, 24, 26, 27, 28, 38, 39, 40, 42, 51, 52, 53, 56, 63], "depend": [12, 13, 56], "deprec": 56, "descent": 63, "describ": [11, 13, 56], "descript": [2, 10, 11, 13, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 56], "deseri": 58, "deserialize_custom_spac": 58, "deserialize_spac": 58, "design": 63, "desir": [32, 61], "desired_cel": 61, "desired_go": [16, 17, 18, 19, 20, 21, 31, 33, 34, 43, 44, 45, 46, 47, 48, 49, 50, 60, 61], "detail": 63, "detect": 56, "determin": 61, "determinist": [12, 61], "develop": 56, "deviat": [13, 61], "devic": [14, 63], "dexter": [25, 29, 41, 54], "df8ff078652a": [15, 42, 61], "dict": [2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 16, 17, 18, 19, 20, 21, 31, 33, 34, 35, 36, 43, 44, 45, 46, 47, 48, 49, 50, 56, 58, 60], "dict_kei": 60, "dictionari": [2, 3, 5, 7, 8, 9, 10, 12, 13, 56, 59, 61, 62, 63], "differ": [10, 12, 13, 42, 56, 58, 61, 63], "dimens": [63, 65], "dimension": [13, 25, 29, 41, 54], "dir": 56, "direct": [35, 36, 58, 63], "directli": [12, 56, 61, 63, 65], "directori": [2, 8, 11, 12, 63], "dirhtml": 1, "disabl": 2, "disable_env_check": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "discount": 61, "discret": [13, 35, 36, 56, 58, 61, 65], "disk": [8, 12, 13, 56, 58, 60, 65], "displai": [63, 65], "dist": 61, "distanc": [43, 45, 47, 49], "distribut": [25, 29, 41, 54, 63], "distribution_class": 63, "distribution_kwarg": 63, "divers": [12, 15], "divid": [12, 61], "do": [61, 63], "doc": [1, 56, 58, 61], "document": [12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56], "doe": 56, "doesn": [8, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 56, 61], "dof": [15, 25, 29, 30, 41, 54, 63], "domain": [15, 25, 29, 30, 41, 42, 54], "don": [13, 56, 58, 60, 61], "done": [12, 61, 63, 65], "door": [10, 12, 13, 14, 22, 23, 24, 30, 32, 55, 56], "dormann": 15, "dot": [61, 63], "doubl": 63, "doubletofloat": 63, "down": 61, "download": [13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 60, 61, 62, 63, 65], "download_dataset": 10, "download_namespace_metadata": 11, "driven": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "dt": 61, "dtype": [56, 60, 61, 63], "due": [56, 61], "dump": 58, "dure": [12, 13, 56, 61, 63], "dynam": 61, "e": [1, 7, 10, 12, 56, 63], "e731": 58, "each": [2, 4, 5, 6, 8, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 60, 61, 63, 65], "earlier": 58, "edit": [2, 5], "effect": [25, 29, 41, 54], "effici": 56, "element": [6, 13], "elif": 61, "elimin": 61, "ell": 63, "elliottow": 56, "els": [12, 56, 61, 63], "email": [2, 10, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56], "embed": 63, "empti": [11, 58, 61], "emptyenv": 58, "enabl": 58, "encapsul": 13, "encount": 58, "encourag": [13, 56], "end": [13, 56], "enerrio": 56, "enhanc": 56, "ensur": 63, "entri": 61, "entropi": 65, "entry_point": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56], "env": [2, 5, 7, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 60, 61, 63, 65], "env_id": 63, "env_nam": [2, 10, 13], "env_spec": [8, 13], "envid": 2, "environ": [2, 5, 6, 7, 8, 9, 10, 13, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 55, 56, 58, 60, 61, 65], "environment_st": 5, "envspec": [2, 8, 10, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56], "eol": 56, "ep": 12, "episod": [2, 3, 4, 6, 7, 8, 10, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 60, 61, 63, 65], "episode_0": 56, "episode_1": 56, "episode_2": 56, "episode_id": [12, 56], "episode_indic": [7, 8, 12], "episode_metadata_callback": [2, 4], "episode_reward": 63, "episodebuff": [7, 8, 10], "episodedata": [7, 12, 56], "episodemetadatacallback": [2, 13, 56], "episodes_gener": 12, "epoch": 65, "epsiodedata": 8, "equal": [2, 10, 13], "equat": 61, "equiv": 63, "equlival": 61, "ernestu": 15, "error": [10, 56, 58, 61, 63], "essenti": 63, "estim": [2, 10, 63], "et": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61, 63], "etc": 63, "euclidean": [43, 45, 47, 49], "evad": 61, "eval_env": [2, 7, 10, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "eval_env_spec": [12, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53], "eval_interv": 63, "eval_reward_log": 63, "eval_td": 63, "evalu": [2, 7, 10, 12, 56, 63, 65], "evaluate_polici": 63, "everi": [1, 10, 12, 13, 21, 61, 63], "everyth": 63, "exampl": [2, 10, 11, 12, 13, 14, 56, 58, 61, 62, 63], "example_env": 63, "except": [8, 56, 58, 63], "excit": 56, "execut": 65, "exerpt": 56, "exist": [8, 11, 14, 56, 60, 61], "exit": 14, "expect": 60, "expectil": 63, "experienc": 56, "experiment": 11, "expert": [2, 10, 12, 13, 14, 15, 22, 25, 26, 29, 36, 37, 38, 41, 51, 54, 55, 56, 63, 65], "expert_polici": [2, 10], "expertpolici": [36, 65], "explain": [56, 61], "explicit": [56, 63], "explicitli": 56, "explor": 56, "exploration_act": 61, "explorationtyp": 63, "export": [12, 56], "extend": [12, 60], "extra": [2, 4, 5, 56, 61], "extract": 63, "extrapol": 63, "f": [12, 14, 56, 58, 60, 63, 65], "f01e2c": 14, "f4bf75": 14, "facilit": [10, 12, 56], "factor": 61, "factori": 3, "fail": [16, 17, 18, 19, 20, 21, 56], "fals": [2, 7, 10, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 58, 60, 61, 63, 65], "familiar": 63, "farama": [1, 10, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 61, 63, 65], "favor": 56, "fc1": 65, "fc2": 65, "fc3": 65, "featur": [11, 12, 55, 56, 65], "fed000": 14, "few": 56, "ff00ff": [14, 55], "ffmpeg": 63, "field": [13, 56, 63], "fig": 63, "figsiz": 63, "figur": 63, "file": [2, 4, 11, 12, 13, 14, 55, 56, 60], "file_fold": 56, "filter": [7, 55, 56], "filter_dataset": [12, 56], "filter_episod": [7, 12, 56], "final": [6, 12, 15, 56, 58, 60, 61, 63], "final_scor": 63, "find": 60, "fine": [14, 23, 25, 27, 29, 39, 41, 52, 54], "first": [11, 12, 56, 58, 60, 61, 63], "fit": [60, 63], "fix": [21, 30, 42, 56, 63], "flag": [10, 56, 63], "flatten": 56, "flexibl": 12, "flip": [16, 17, 18, 19, 20, 21, 32], "float": [2, 8, 10, 13, 60, 63], "float32": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 61, 65], "float64": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 60, 63], "floppy_disk": 56, "folder": [1, 65], "follow": [2, 5, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 61, 63], "font": [14, 55], "forc": [10, 14, 30, 42, 61], "force_download": [10, 56], "form": [10, 13, 61], "format": [2, 8, 10, 12, 13, 56, 58], "formula": [10, 61], "forward": [11, 13, 63, 65], "found": [10, 13], "foundat": [1, 12, 14, 30, 56, 58, 61], "four": 65, "fourroom": [30, 37], "fourroomsenv": [35, 36], "fp": 63, "frac": 10, "frame": 63, "framework": 63, "franka_kitchen": [31, 33, 34], "frankakitchen": [30, 31, 32, 33, 34, 56], "from": [2, 5, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 60, 61, 63, 65], "from_pixel": 63, "froze": 56, "fu": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "full": [4, 8, 12, 36, 37, 56, 63], "fulli": 56, "function": [7, 8, 10, 12, 13, 14, 35, 36, 42, 43, 44, 45, 46, 47, 48, 49, 50, 56, 58, 61, 63, 65], "fundament": [15, 42, 61], "futur": [11, 12, 56, 61], "g": [12, 16, 17, 18, 19, 20, 21, 35, 36, 43, 44, 45, 46, 47, 48, 49, 50, 63], "gain": 61, "gamma": [61, 63], "gather": 63, "gcp": [12, 13, 55, 56], "gen_dataset_md": 56, "gener": [2, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 60, 61], "generate_path": 61, "get": [7, 8, 10, 12, 56, 58, 60, 61, 63, 65], "get_episod": 8, "get_episode_metadata": [8, 13], "get_namespace_metadata": 11, "get_next_st": 61, "get_normalized_scor": [2, 10, 56], "get_q_valu": 61, "get_siz": 8, "git": [1, 12], "github": [1, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 61], "give": [12, 13, 14, 61, 63], "given": [12, 13, 14], "gleav": 15, "global": [2, 13, 61], "global_target_id": 61, "global_target_xi": 61, "glr": 56, "gmail": [16, 17, 18, 19, 20, 21, 35, 36], "go": [1, 61], "goal": [15, 16, 17, 18, 19, 20, 21, 32, 36, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 58, 60, 61, 63], "goal_cel": 61, "goe": [36, 37], "googl": [13, 56, 63], "gradient": 63, "grahamannett": 56, "greater": [12, 56], "green": [58, 63], "grid": 61, "gridworld": 37, "group": [2, 4, 10, 12, 13, 14, 30, 56, 61], "gt": 56, "guarante": 13, "gupta": 32, "gym": [2, 5, 7, 10, 12, 56, 58, 60, 61, 63, 65], "gymansium": 12, "gymenv": 63, "gymnaisum": 14, "gymnasium": [2, 5, 7, 8, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 60, 61, 63, 65], "gymnasium_robot": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "gynasium": 56, "h5py": 56, "ha": [12, 21, 42, 56, 61, 63], "hammer": [26, 27, 28, 30, 56], "hand": [13, 16, 18, 25, 29, 41, 54, 61, 63], "hand_dapg": [14, 25, 29, 30, 41, 54], "handl": [8, 12, 55], "hat": 63, "hausman": 32, "have": [12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 36, 38, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 58, 60, 61, 63, 65], "hdf5": [2, 4, 8, 13, 14, 55, 56, 60, 61], "help": [14, 56, 61], "helper": 63, "here": [63, 65], "hesit": 56, "hidden": 56, "hidden_s": 63, "hierarch": 12, "high": [25, 29, 41, 54, 56, 60, 61, 63], "higher": 61, "highli": 56, "hill": 15, "hing": [31, 33, 34], "hood": 63, "horizon": 32, "host": [12, 14, 25, 29, 30, 32, 41, 54, 55], "how": [1, 2, 56, 58, 60, 61, 63, 65], "howev": [13, 42, 56, 58, 61, 63, 65], "howuhh": 56, "href": 14, "html": 63, "http": [1, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 58, 61, 65], "hub": 56, "human": [10, 12, 13, 14, 22, 25, 26, 29, 38, 41, 51, 54, 55, 56, 63, 65], "hyperparamet": 63, "hypothet": [2, 10], "i": [1, 2, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 32, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 58, 60, 63, 65], "id": [2, 3, 6, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 61, 65], "idea": 56, "identifi": [2, 10, 11, 13], "ignor": [56, 63], "im": 56, "imag": [35, 36, 58, 63], "imit": [22, 25, 26, 29, 32, 38, 41, 51, 54], "implement": [14, 15, 61, 63], "implicit": [62, 66], "implicitli": 63, "import": [2, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 60, 61, 63], "import_bugfix": 56, "improv": [56, 63], "imshow": 63, "in_kei": 63, "includ": [6, 13, 31, 32, 34, 42, 56, 63], "incompat": 14, "incorrect": [8, 56], "increas": 6, "indic": [2, 7, 8, 10, 12, 56], "inf": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 60], "infer": 63, "influenc": [61, 63], "info": [2, 3, 5, 6, 9, 12, 13, 56, 61, 65], "inform": [1, 2, 5, 7, 13, 56, 61], "infos_dataset": 56, "infos_subgroup": 56, "init": 56, "initi": [2, 6, 7, 12, 13, 56, 58, 60, 61, 63, 65], "initialis": 63, "input": [5, 7, 12, 13, 63, 65], "input_dim": 65, "insid": 58, "inspir": 61, "instabl": 61, "instal": [1, 10, 14, 55, 56, 58, 63, 65], "instanc": [7, 56], "instanti": 14, "instead": [12, 13, 56, 61, 63], "instruct": 56, "int": [2, 3, 6, 7, 8, 10, 13, 56, 61], "int64": [56, 65], "int_": [7, 61], "integ": 13, "intend": 7, "interact": 32, "interest": 63, "interfac": 12, "intern": [12, 56], "introduc": [15, 25, 29, 41, 54, 56, 63], "invers": 63, "involv": [30, 42, 61], "ipynb": [58, 60, 61, 63, 65], "ipython": 63, "iql": 63, "iql_torchrl": 63, "iqlloss": 63, "is_avail": 63, "is_shar": 63, "isinst": 65, "isol": 56, "issu": [56, 63], "item": [2, 61, 63, 65], "iter": [7, 8, 12, 13, 15, 42, 61, 63], "iterate_episod": [7, 12, 56], "its": [10, 56, 58, 61, 63], "itself": 12, "j": 61, "jamartinh": 56, "josephcarrino": 56, "journal": 15, "json": [13, 14, 56, 58], "jupyt": [58, 60, 61, 62, 63, 65], "just": [12, 58, 63], "justin": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "k": 32, "k_": 61, "k_d": 61, "k_i": 61, "k_p": 61, "kabuki": 56, "kaixin96": 56, "kanervisto": 15, "keep": [12, 56], "kei": [2, 5, 8, 10, 12, 14, 56, 60, 61, 63], "kept": 13, "kernel": 63, "kettl": [31, 32, 33, 34], "key_fil": 14, "key_path": 11, "kitchen": [30, 31, 33, 34, 56], "kitchenenv": [31, 33, 34], "kitsch": 56, "know": 61, "kostrikov": 63, "kumar": 32, "kwarg": [2, 5, 7, 11, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 60], "l": 63, "l2": 63, "l_": 63, "l_2": 63, "l_pi": 63, "l_q": 63, "l_v": 63, "lag": 63, "lambda": [7, 12, 56, 58, 61], "lambert": [15, 42, 61], "larg": [12, 15, 42, 56], "larger": [56, 61, 63], "largest": 56, "last": 56, "last_episode_id": 56, "later": [2, 10, 56, 63], "latest": [10, 14, 56, 61], "latest_vers": 10, "latter": [10, 13, 63], "layer": 63, "lazcano": [12, 14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 51, 52, 53], "lazi": 63, "lazylinear": 63, "lead": [13, 16, 17, 18, 19, 20, 21, 61], "learn": [12, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 55, 56, 58, 60, 61, 62, 65, 66], "learnin": [15, 42, 61], "leav": 12, "left": [12, 61, 63], "leftarrow": [61, 63], "len": [61, 63], "length": [3, 65], "less": 61, "let": [58, 60, 61, 65], "level": 13, "levin": 32, "lib": 63, "librari": [12, 56, 58, 65], "light": [31, 32, 33, 34], "like": [11, 12, 14, 58, 63, 65], "limit": [61, 63], "linalg": 61, "line": [14, 60], "linear": 65, "link": [2, 10, 12, 13], "linux": 12, "list": [2, 3, 7, 8, 12, 13, 55, 56, 63, 65], "list_local_dataset": [10, 12, 56, 60], "list_local_namespac": 11, "list_remote_dataset": [10, 56], "list_remote_namespac": 11, "ll": [58, 60], "load": [2, 11, 13, 56, 58, 63, 65], "load_dataset": [2, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 65], "loc": 63, "local": [10, 13, 56, 58, 60, 63, 65], "local_dataset": 60, "locat": [12, 15, 16, 17, 18, 19, 20, 21, 30, 42, 43, 44, 45, 46, 47, 48, 49, 50, 61, 63], "log": [56, 63, 65], "long": [32, 61], "longer": 56, "look": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58], "loop": [12, 63, 65], "loos": 56, "lose": 12, "loss": 65, "loss_actor": 63, "loss_dict": 63, "loss_fn": 65, "loss_funct": 63, "loss_log": 63, "loss_modul": 63, "loss_qvalu": 63, "loss_valu": 63, "lost": 56, "low": [56, 60, 61, 63], "lower": 13, "lr": 63, "lynch": 32, "m_": 63, "machin": [13, 15], "maco": 12, "made": [1, 56], "mai": [11, 12, 61, 63], "main": [2, 7, 56, 58, 61, 63], "main_data": [14, 55, 56], "major": 56, "make": [1, 2, 7, 12, 56, 58, 60, 61, 63, 65], "make_value_estim": 63, "manag": 56, "mandatori": [13, 56], "mani": 13, "manipul": [25, 29, 41, 54, 63], "manual_se": [63, 65], "map": [12, 16, 18, 61, 63], "map_length": 61, "map_width": 61, "margin": 63, "markdown": 56, "markovian": [15, 42], "master": 61, "match": 10, "mathbb": 63, "mathcal": 63, "matplotlib": 63, "matrix": 61, "max": [61, 63], "max_": [61, 63], "max_a": 63, "max_episode_step": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 61, 63], "max_step": 63, "maximilian": 15, "maximis": 63, "maximum": [2, 10, 13, 61, 63, 65], "maze": [16, 17, 18, 19, 20, 21, 30, 43, 44, 45, 46, 47, 48, 49, 50, 56, 61], "maze2d": [42, 61], "maze_map": [16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 61], "maze_solv": 61, "mb": [8, 12, 14, 55], "md": [1, 56], "mdp": [12, 56], "mean": [6, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 61, 63], "meant": [2, 56], "measur": [25, 29, 41, 54, 61], "medium": [12, 15, 42, 56], "memor": [15, 42], "memori": [2, 12, 56], "mention": [13, 56, 61, 65], "merg": 14, "messag": 14, "met": 7, "metadata": [2, 4, 7, 8, 10, 12, 14, 56, 60], "method": [12, 15, 42, 56, 58, 61, 63], "metric": 13, "mgoulao": 56, "microwav": [31, 32, 33, 34], "mimic": 15, "min": 63, "minari": [11, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 60, 63, 65], "minari_autose": 2, "minari_data": 63, "minari_dataset": [56, 65], "minari_datasets_path": 13, "minari_remot": [12, 56], "minari_storag": 56, "minari_vers": [13, 56], "minaridataset": [2, 10, 12, 13, 56, 65], "minariexperiencereplai": 63, "minaristorag": [2, 7, 10, 13, 56], "minigrid": [30, 35, 36, 56, 58], "minim": 60, "minimis": 63, "minimum": [2, 10, 12, 13, 56], "minor": 56, "mirana": 60, "misc": 56, "miss": 56, "mission": [35, 36, 58], "mission_func": 58, "missionspac": [35, 36, 58], "missonspac": 58, "mix": [22, 25, 26, 29, 32, 38, 41, 51, 54, 56], "mlp": 63, "mode": 63, "modifi": [8, 12, 13, 56, 60], "modul": [58, 60, 61, 63, 65], "modulelist": 63, "moment": 13, "more": [1, 6, 12, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 61, 63], "more_dataset": 56, "moreov": [8, 13], "morpholog": 15, "most": [12, 14], "move": [12, 30, 32, 42, 54, 56, 61], "mp4": 63, "mujoco": [2, 10, 61], "multi": 63, "multipl": [10, 11, 12, 14, 56, 63], "must": [5, 7, 8, 10, 12, 13, 56, 63], "my": 12, "n": [7, 12, 13, 14, 61, 65], "n_episod": [7, 12], "n_step": [56, 61], "nail": 29, "name": [2, 10, 11, 12, 13, 14, 55, 56, 58, 65], "namespac": [2, 10, 56], "namespace_metadata": 13, "narrow": [25, 29, 41, 54], "nathan": [15, 42, 61], "navig": [15, 30, 37, 42], "ncol": 63, "ndarrai": [6, 7, 10, 13, 56], "necessari": 63, "need": [8, 12, 56, 58, 60, 61, 63, 65], "neg": [43, 45, 47, 49], "nest": [2, 5, 11, 13, 56], "net": 63, "network": [63, 65], "neural": 65, "never": [32, 33, 61, 63], "new": [2, 8, 10, 12, 16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 56, 58, 61, 63, 65], "new_dataset_id": [10, 56], "new_dataset_nam": 14, "newli": [10, 12, 63], "next": [9, 56, 61, 63, 65], "next_cel": 61, "next_episode_id": 56, "next_stat": 61, "nightli": 63, "nn": [63, 65], "no_grad": 63, "noah": 15, "nois": [43, 44, 45, 46, 47, 48, 49, 50, 56, 61], "non": [12, 13, 15, 42], "nondeterminist": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "none": [2, 3, 5, 7, 8, 9, 10, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 61], "nonetyp": 56, "noqa": 58, "norm": 61, "normal": [2, 63], "normalized_scor": 10, "normalparamextractor": 63, "note": [10, 11, 13, 16, 17, 18, 19, 20, 21, 60, 61, 63], "notebook": [58, 60, 61, 62, 63, 65], "notic": 12, "notimplementederror": 58, "now": [10, 12, 56, 58, 60, 61, 65], "np": [7, 10, 13, 56, 60, 61, 63, 65], "npt": 7, "nrow": 63, "num_act": 61, "num_cel": 63, "num_episod": [58, 60], "num_episodes_average_scor": [2, 10], "num_epoch": 65, "num_eval_episod": 63, "num_itr": 61, "num_stat": 61, "num_step": 2, "number": [2, 6, 7, 10, 12, 13, 14, 56], "numpi": [60, 61, 63, 65], "o": 65, "ob": [2, 5, 12, 56, 61, 65], "object": [7, 8, 9, 12, 25, 29, 32, 37, 41, 54, 56, 58, 63, 65], "observ": [2, 3, 5, 6, 8, 9, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 37, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 60, 61, 63, 65], "observation_spac": [2, 8, 10, 12, 13, 56, 58, 60, 65], "observation_space_subset": 60, "obstyp": [2, 10], "obtain": [22, 25, 26, 29, 38, 41, 51, 54, 61], "occur": [16, 17, 18, 19, 20, 21], "off": 14, "offici": 56, "offlin": [12, 13, 14, 55, 56, 61, 63, 65], "often": 61, "oibserv": 56, "omar": [35, 36], "omit": 60, "onc": [1, 12, 61, 63, 65], "one": [2, 6, 7, 8, 12, 25, 29, 41, 42, 54, 56, 63], "one_hot": 65, "onli": [10, 11, 12, 13, 42, 44, 46, 47, 48, 50, 56, 60, 63], "onlin": 63, "onto": 11, "open": [25, 32, 42, 56, 63], "opengl": 63, "optim": [61, 65], "option": [2, 3, 5, 7, 8, 10, 12, 13, 14, 56], "order": [12, 31, 32, 56, 60], "order_enforc": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "org": [11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 58, 61, 65], "organ": 56, "orient": [5, 41, 60], "origin": [10, 12, 25, 29, 30, 32, 41, 42, 54, 56, 58, 63], "other": [7, 8, 10, 11, 12, 13, 14, 32, 34, 56, 60, 61, 63], "otherwis": [7, 12, 44, 46, 48, 50, 56], "our": [1, 12, 13, 56, 60, 61, 63, 65], "ourselv": 61, "out": [8, 12, 56, 58, 61, 63], "out_featur": 63, "out_kei": 63, "outlin": 60, "output": [8, 58, 60, 61, 63, 65], "output_dim": 65, "outsid": 63, "over": [2, 7, 10, 12, 61, 63], "overal": 63, "overconfid": 63, "overestim": 63, "overrid": [4, 5, 13, 14, 61], "overridden": [4, 5, 10, 56], "overridng": 61, "overshoot": 61, "overview": 63, "overwrit": 11, "own": [10, 12, 56, 61], "p_": 61, "packag": [1, 2, 10, 14, 56, 65], "pad": 65, "pad_sequ": 65, "page": 56, "page_facing_up": 56, "pair": [13, 63], "paper": [25, 29, 41, 54], "paramet": [2, 3, 4, 5, 7, 8, 10, 11, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 63, 65], "parameteris": 63, "part": 63, "partial": [32, 56], "particular": [58, 63], "pass": [2, 4, 7, 10, 12, 60, 63], "past": 56, "path": [8, 11, 12, 13, 14, 43, 44, 45, 46, 47, 48, 49, 50, 56, 61, 65], "path_str": 14, "pathlik": [7, 8], "pbar": 63, "pd": [42, 43, 44, 45, 46, 47, 48, 49, 50, 61], "pen": [14, 30, 38, 39, 40, 56], "per": [2, 56], "perceptron": 63, "perez": [43, 44, 45, 46, 47, 48, 49, 50, 61], "perform": [9, 10, 12, 14, 32, 33, 34, 61, 63, 65], "perimet": [42, 47, 48], "permalink": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "perman": 12, "pettingzoo": 56, "phi": 63, "pi": [61, 63], "pi_": 63, "pick": [16, 18], "pid": [56, 61], "pip": [1, 2, 10, 12, 13, 14, 55, 58, 63, 65], "pixel": 63, "pixels_onli": 63, "plai": [12, 15], "plan": [12, 56, 60], "planner": [15, 42], "platform": 13, "pleas": [11, 12, 56, 60], "plot": 63, "plt": 63, "plug": 63, "point": [7, 30, 56, 63], "point_maz": [43, 44, 45, 46, 47, 48, 49, 50], "point_maze_dataset": [56, 61], "pointmaz": [15, 30, 43, 44, 45, 46, 47, 48, 49, 50, 56, 59, 60, 62], "pointmaze_larg": [42, 44], "pointmaze_largedens": [42, 43], "pointmaze_medium": [42, 46, 61], "pointmaze_mediumdens": [42, 45], "pointmaze_open": [42, 48], "pointmaze_opendens": [42, 47], "pointmaze_umaz": [42, 50, 60], "pointmaze_umazedens": [42, 49], "pointmazeenv": [43, 44, 45, 46, 47, 48, 49, 50], "pointmazestepdatacallback": 61, "pole": 65, "polici": [2, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 29, 30, 32, 36, 37, 38, 39, 41, 42, 51, 52, 54, 61, 63], "policy_net": 65, "policynetwork": 65, "polyak": 63, "poorli": 63, "popul": 63, "popular": 55, "pose": [5, 61], "posit": [5, 32, 37, 54, 61, 63], "possibl": [13, 56], "ppo": 65, "pr": 56, "practic": 63, "pre": 56, "precis": 63, "precommit": 56, "predict": [61, 65], "prepend": 11, "preprint": 32, "prerequisit": 63, "present": [10, 15, 30, 65], "prevent": 12, "previou": [2, 12, 56], "previous": [15, 56, 61, 65], "principl": 30, "print": [12, 56, 58, 60, 63, 65], "prng": 2, "probabilisticactor": 63, "probabl": 61, "problem": 65, "proce": [14, 65], "procedur": 60, "process": [12, 56, 61, 63], "prod": 65, "produc": 56, "program": 61, "progress": 14, "project": [12, 56], "prompt": [12, 14], "properli": [58, 63], "properti": [7, 63], "proporti": 61, "provid": [10, 12, 13, 14, 15, 16, 18, 22, 23, 24, 25, 26, 27, 28, 29, 30, 38, 39, 40, 41, 51, 52, 53, 54, 55, 56, 63], "pseudo": 56, "psi": 63, "public": [13, 56, 61], "publicli": 55, "pure": 56, "purpos": [12, 30, 42, 61, 63], "py": [56, 58, 60, 61, 63, 65], "pyarrow": 56, "pypi": 56, "pyplot": 63, "pyright": 56, "pytest": 56, "python": [12, 55, 56, 58, 60, 61, 62, 63, 65], "python3": 63, "pytorch": [56, 62, 63, 66], "pytorchdataload": 56, "pyvirtualdisplai": 63, "pz": 56, "q": [61, 62, 66], "q_": 63, "q_fn": 61, "q_iter": 61, "q_net": 63, "q_valu": 61, "qiter": [15, 16, 17, 18, 19, 20, 21, 42, 43, 44, 45, 46, 47, 48, 49, 50, 61], "qpo": 61, "quadrup": [15, 30], "quantifi": 63, "queri": 63, "quick": 63, "quickli": 61, "quit": 63, "qvalu": 63, "qvel": 61, "r": [1, 16, 17, 18, 19, 20, 21, 61, 63], "r_t": 63, "raffin": 15, "rais": [8, 10], "rajeswaran": [25, 29, 41, 54], "randn": 61, "random": [2, 7, 10, 12, 17, 19, 20, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 58, 60, 61, 63, 65], "random_polici": [58, 60], "randomis": 63, "randomli": [12, 13, 42, 58, 61], "randompolici": 35, "rang": [2, 10, 12, 56, 58, 60, 61, 63, 65], "rate": [16, 17, 18, 19, 20, 21, 61], "rather": 63, "ratio": [22, 25, 26, 29, 38, 41, 51, 54], "rb": 63, "re": [56, 61], "reach": [15, 16, 17, 18, 19, 20, 21, 32, 37, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 56, 61], "read": [8, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 63], "readabl": 13, "readi": 56, "readm": 56, "real": 15, "reason": 61, "rebuild": 1, "receiv": 65, "recent": [12, 63], "recommend": 12, "record": [2, 12, 56, 60, 61], "record_info": [2, 12, 13, 61], "recov": [2, 7, 10, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 63], "recover_env": 56, "recover_environ": [2, 7, 10, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 65], "recoveri": 56, "redtachyon": 56, "reduc": [56, 61], "ref": 10, "ref_max_scor": [2, 10], "ref_min_scor": [2, 10], "refactor": [56, 61], "refer": [2, 10, 30, 56], "referenc": 56, "regener": 37, "regist": 58, "registr": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "registri": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "reinforc": [12, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 55, 61], "rel": 56, "relai": [30, 32], "releas": 11, "relev": [2, 10, 12], "reliabl": 15, "reloc": [30, 51, 52, 53, 56], "relu": [63, 65], "rememb": 63, "remot": [10, 11, 12, 13, 14, 55, 56], "remov": [12, 56], "remove_task_when_complet": [31, 33, 34], "renam": 56, "render": 63, "render_mod": 65, "reorgan": 56, "replac": [15, 30, 61], "replai": [12, 56], "replay_buff": 63, "repositori": [10, 13, 14, 23, 24, 25, 27, 28, 29, 30, 32, 39, 40, 41, 52, 53, 54], "repres": [13, 58, 63], "represent": 56, "reproduc": [2, 10, 12, 30, 37, 63, 65], "reproduct": [30, 56], "requir": [1, 2, 10, 12, 13, 14, 56, 58, 60, 61, 63, 65], "research": 15, "reset": [2, 12, 13, 16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 56, 58, 60, 61, 63, 65], "reset_target": [16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50], "resid": 11, "residu": 56, "respect": [10, 61, 63], "respond": 61, "respons": 12, "rest": 63, "restart": 63, "result": [10, 56, 58, 61], "results_video": 63, "retriev": [10, 12, 56], "return": [2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 44, 46, 48, 50, 51, 52, 53, 56, 58, 60, 61, 63, 65], "rew": [2, 5, 12, 56, 61, 65], "rew_matrix": 61, "reward": [3, 5, 6, 12, 13, 15, 16, 17, 18, 19, 20, 21, 25, 29, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 56, 63, 65], "reward_funct": 61, "reward_threshold": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "reward_typ": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "rewards_max": 13, "rewards_mean": 13, "rewards_min": 13, "rewards_std": 13, "rewards_sum": 13, "right": [56, 61, 63], "rl": [12, 14, 23, 25, 27, 29, 39, 41, 52, 54, 56, 63, 65], "rl_zoo3": [56, 65], "rm": 63, "rnd": 56, "rnn": 65, "robot": [14, 15, 25, 29, 30, 41, 54, 56, 60, 61, 63], "rodrigo": [12, 14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 61], "rodrigodelazcano": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56], "roll": 63, "rollout": 63, "root": [12, 13], "row": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "rperezvicent": [14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 61], "rugged": 56, "run": [12, 22, 25, 26, 29, 38, 41, 51, 54, 56, 63], "s_": 63, "s_t": 63, "sac": [15, 16, 17, 18, 19, 20, 21], "safe": 56, "same": [2, 7, 10, 12, 13, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 56, 61, 63], "sampl": [2, 7, 13, 35, 37, 55, 56, 58, 60, 63], "sample_episod": [7, 12, 13, 56], "sampled_episod": 13, "sampler": 63, "samplerwithoutreplac": 63, "save": [4, 13, 56, 58, 60, 61, 63, 65], "save_video": 63, "scale": 63, "scale_lb": 63, "scenario": 65, "schedul": [12, 56], "score": [2, 63], "script": [14, 30, 63, 65], "second": [12, 56], "section": [13, 56, 63], "see": [13, 58, 63], "seed": [2, 3, 7, 10, 12, 13, 56, 58, 60, 61, 63, 65], "seen": 61, "select": [16, 17, 18, 19, 20, 25, 29, 41, 42, 54, 56, 61], "self": [2, 3, 4, 5, 7, 8, 60, 61, 65], "separ": 56, "sequenc": [32, 33, 34, 42], "sequenti": 63, "seri": [12, 61], "serial": [13, 56, 59, 62], "serializ": 13, "serialize_custom_spac": 58, "serialize_spac": 58, "serv": 12, "server": [10, 11, 12, 14, 55, 63], "servic": 56, "set": [2, 7, 10, 12, 13, 15, 16, 17, 18, 19, 20, 21, 56, 61, 63, 65], "set_descript": 63, "set_exploration_typ": 63, "set_se": [7, 12, 63], "set_titl": 63, "set_xlabel": 63, "setpoint": 61, "sever": 13, "shape": [15, 20, 21, 42, 49, 50, 56, 60, 61, 63, 65], "shard": 12, "share": [56, 63], "shift": [13, 63], "should": [2, 58, 60], "show": [12, 55, 56, 58, 60, 63], "shown": [14, 63], "shreyansjainn": 56, "shuffl": 65, "sim": 63, "similarli": [56, 63], "simpl": [12, 56, 61, 63, 65], "simplefilt": 63, "simpli": [58, 61], "sinc": [58, 61, 65], "singl": [3, 6, 9, 10, 12, 14, 56, 63], "size": [8, 10, 12, 14, 55, 56, 61, 63], "skip": [10, 63], "slash": [11, 13], "slice": [7, 8], "slide": [31, 32, 33, 34], "slightli": 56, "slowli": [61, 63], "small": [56, 63], "smaller": [42, 56, 61], "snippet": 12, "so": [12, 13, 61, 63], "soft": 63, "softupd": 63, "solut": 61, "solv": [32, 61], "solver": 61, "some": [2, 8, 12, 14, 56, 58, 61, 63], "sourc": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 56, 58, 60, 61, 62, 63, 65], "space": [2, 8, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 37, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 59, 61, 62, 63, 65], "space_dict": 58, "spars": [15, 16, 17, 18, 19, 20, 21, 25, 29, 41, 42, 44, 46, 48, 50, 54], "spec": [2, 7, 10, 13, 14, 56, 58, 63], "specif": [12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 60, 61, 63], "specifi": [2, 7, 8, 12, 13, 56, 63], "speed": [56, 61], "sphinx": 1, "sphinx_github_changelog_token": 56, "sphx": 56, "split": [42, 56], "split_dataset": [10, 12, 56], "split_traj": 63, "squar": 58, "src": 63, "stabil": 61, "stabl": 15, "stable_baselines3": 65, "stack": [6, 13, 56], "stand": [16, 17, 18, 19, 20, 21], "standard": [12, 56, 63], "start": [12, 13, 58, 60, 61, 63, 65], "state": [2, 32, 42, 61, 63], "state_action_valu": 63, "state_to_cel": 61, "state_valu": 63, "statist": 4, "steadi": 61, "step": [2, 3, 5, 6, 7, 8, 9, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 60, 61, 63, 65], "step_data": [3, 5, 60, 61], "step_data_callback": [2, 60, 61], "step_data_kei": 5, "stepdata": [3, 5], "stepdatacallback": [2, 13, 56, 59, 62], "stitch": 15, "storag": [8, 12, 13, 56], "store": [2, 8, 10, 12, 13, 56, 60, 63], "str": [2, 5, 8, 9, 10, 11, 13, 58], "straight": [36, 37], "strictli": 63, "string": [11, 13, 58], "stronger": 61, "structur": [11, 12, 56], "style": [2, 10, 13, 56, 63], "sub": [14, 56], "subcomponent_1": 56, "subcomponent_2": 56, "subdirectori": 13, "subgroup": [56, 61], "subplot": 63, "subsequ": 56, "subset": [56, 59, 62], "subtask": [31, 32, 33, 34], "subtrajectori": [32, 34], "succ": 61, "success": [16, 17, 18, 19, 20, 21, 61, 65], "successfulli": [14, 60], "sudo": 63, "suggest": 56, "sum": 63, "sum_": 61, "summari": 63, "super": [5, 60, 61, 65], "support": [2, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 61, 63], "supportsfloat": 2, "suppos": 12, "sure": [14, 56], "surrog": 13, "switch": [31, 32, 33, 34], "sy": 65, "syntax": [2, 10, 13], "system": 61, "t": [2, 8, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 56, 58, 60, 61, 63], "tabl": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56], "tackl": 63, "take": [7, 13, 58, 61], "taken": [6, 8, 43, 44, 45, 46, 47, 48, 49, 50, 60], "tanh": 63, "tanh_loc": 63, "tanhnorm": 63, "target": [16, 17, 18, 19, 20, 21, 30, 31, 32, 33, 34, 42, 54, 61, 63], "target_net_updat": 63, "task": [10, 12, 15, 25, 29, 32, 34, 41, 43, 44, 45, 46, 47, 48, 49, 50, 54, 61, 63, 65], "tasks_to_complet": [31, 33, 34], "tau": [61, 63], "td": 63, "team": 11, "temperatur": 63, "templat": 56, "tempor": 63, "temporari": [2, 12, 56, 61], "tensor": [63, 65], "tensordict": 63, "tensordictmodul": 63, "termin": [2, 3, 5, 6, 7, 9, 12, 13, 16, 17, 18, 19, 20, 21, 42, 56, 58, 60, 61, 63, 65], "terminate_on_tasks_complet": [31, 33, 34], "test": [10, 11, 12, 15, 56, 60], "text": [13, 35, 36, 56, 61], "than": [10, 12, 16, 17, 18, 19, 20, 21, 56, 63], "thank": 56, "thei": [8, 13, 30, 56, 63], "them": [12, 13, 56, 65], "theme": 61, "theori": 61, "therefor": 63, "theta": 63, "thi": [1, 2, 4, 5, 6, 7, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 56, 58, 60, 61, 63, 65], "thing": [56, 58], "think": 61, "thorough": 56, "those": 63, "thought": 56, "three": [25, 29, 41, 54, 61, 63], "through": [12, 13, 14, 55, 56, 61, 63], "thu": [42, 61], "tight_layout": 63, "time": [1, 2, 10, 61], "timestep": 56, "to_str": 58, "togeth": [10, 12, 14, 32, 33, 63], "tohsin": 56, "tomekst": 56, "tool": [14, 29, 56], "top": [13, 14, 31, 33, 34], "torch": [63, 65], "torchrl": [62, 66], "total": [7, 8, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 61, 63], "total_episod": [7, 8, 12, 13, 56, 65], "total_step": [7, 8, 12, 13, 56, 61], "total_timestep": 56, "touch": [11, 60], "toward": 61, "towardsdatasci": [15, 42, 61], "tqdm": [63, 65], "train": [15, 16, 17, 18, 19, 20, 21, 22, 25, 26, 29, 38, 41, 51, 54, 60], "trainer": 63, "trajectori": [14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 29, 39, 41, 42, 52, 54, 55, 56, 61], "transform": 63, "transformedenv": 63, "transit": [5, 56, 61, 63], "transition_matrix": 61, "tri": 63, "true": [2, 7, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 61, 63, 65], "truncat": [2, 3, 5, 6, 9, 12, 13, 42, 56, 58, 60, 61, 63, 65], "try": [58, 63], "tune": [14, 23, 25, 27, 29, 39, 41, 52, 54, 61, 63], "tupl": [2, 3, 13, 56, 61, 63], "tutori": [56, 58, 60, 61, 63, 65], "tutorials_jupyt": 62, "tutorials_python": 62, "two": [10, 12, 13, 14, 25, 29, 41, 42, 54, 56, 63, 65], "txt": 1, "type": [2, 12, 13, 25, 29, 41, 54, 56, 58, 63, 65], "typer": 14, "typic": 61, "typing_extens": 56, "typo": 56, "u": [14, 15, 20, 21, 42, 49, 50, 56, 63, 65], "uint8": [35, 36, 58, 63], "umaz": [15, 42, 56, 61], "under": [10, 13, 42, 56, 63], "undiscount": [10, 13], "unflatten": 56, "unifi": 56, "uniform": 61, "union": [7, 58], "uniqu": 58, "unknown": 56, "unless": 2, "unlik": 63, "until": [12, 43, 44, 45, 46, 47, 48, 49, 50], "up": [12, 16, 17, 18, 19, 20, 21, 56, 58, 60, 61, 63, 65], "updat": [2, 8, 12, 56, 61, 63], "update_dataset_from_buff": 7, "update_dataset_from_collector_env": 56, "update_episod": 8, "update_episode_metadata": 8, "update_from_storag": 8, "update_metadata": 8, "upgrad": 63, "upload": 56, "upload_namespac": 11, "upon": 15, "upper": 13, "us": [2, 7, 8, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 60, 61, 63, 65], "usag": [14, 56], "user": [2, 12, 13, 56], "usual": 63, "util": [10, 12, 55, 63, 65], "v": [2, 10, 13, 14, 32, 63], "v0": [10, 11, 12, 13, 35, 36, 37, 58, 60, 61, 65], "v1": [10, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 38, 39, 40, 41, 51, 52, 53, 54, 56, 63, 65], "v1_1": 65, "v2": [12, 13, 14, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 63], "v3": [42, 43, 44, 45, 46, 47, 48, 49, 50, 56, 60, 61], "v4": [15, 16, 17, 18, 19, 20, 21], "v_": [61, 63], "v_fn": 61, "valid": [10, 60, 61, 63], "valu": [2, 5, 6, 8, 9, 10, 12, 13, 44, 46, 48, 50, 56, 61, 63], "value_net": 63, "value_network": 63, "valueerror": 8, "valueoper": 63, "vari": [58, 63, 65], "variabl": [12, 13, 56, 61], "varianc": [43, 44, 45, 46, 47, 48, 49, 50, 61], "variat": 61, "varieti": 12, "variou": [32, 33, 58], "ve": 61, "vector_entry_point": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "veloc": [5, 42, 61], "veri": 12, "version": [2, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 60, 61], "via": [32, 63], "vicent": [43, 44, 45, 46, 47, 48, 49, 50, 61], "video": 63, "video_fold": 63, "viewer_env": 63, "virtual": 63, "virtual_displai": 63, "visibl": 63, "visual": 65, "visualis": 63, "vol": [15, 25, 29, 30, 32, 37, 41, 42, 54, 61], "wa": [2, 7, 10, 13, 15, 25, 29, 35, 36, 37, 41, 54, 56, 58], "wai": [12, 61, 63], "wall": [42, 47, 48, 61], "want": [7, 12, 14, 61], "wapoint": 61, "warn": [14, 56, 63], "waypoint": [15, 16, 17, 18, 19, 20, 21, 42, 43, 44, 45, 46, 47, 48, 49, 50], "waypoint_control": 61, "waypoint_target": 61, "waypoint_threshold": 61, "waypointcontrol": 61, "wd": 56, "we": [12, 13, 30, 37, 56, 58, 60, 61, 63, 65], "weight": 63, "well": [12, 13, 14, 55, 56, 61, 63], "were": [10, 12, 14, 25, 29, 30, 32, 41, 42, 54, 56], "what": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 61], "when": [7, 12, 13, 16, 17, 18, 19, 20, 21, 42, 43, 44, 45, 46, 47, 48, 49, 50, 56, 58, 60, 61, 63], "where": [2, 8, 10, 13, 32, 34, 56, 61, 63], "whether": 11, "which": [2, 7, 8, 10, 12, 13, 15, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 60, 61, 63, 65], "while": [12, 56, 58, 60, 61, 63, 65], "who": 63, "whose": 63, "willdudlei": 56, "window": 56, "within": [7, 56, 63], "without": [43, 44, 45, 46, 47, 48, 49, 50, 56], "won": [12, 61], "work": [2, 12, 14, 56, 63], "workflow": 56, "world": 15, "worri": 58, "would": [11, 13, 14, 60, 61], "wrap": [2, 12, 56, 61, 63], "wrapper": [2, 4, 12, 13, 56, 58, 61, 63, 65], "write": [8, 63], "written": 63, "x": [7, 30, 42, 61, 65], "xvfb": 63, "xy": 61, "y": [14, 30, 42, 61, 63], "yml": 56, "you": [7, 8, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 56, 58, 60, 61, 63, 65], "youni": [35, 36], "younik": 56, "younis98": 36, "your": [12, 14, 56, 65], "zero": 61, "zero_grad": [63, 65], "zip": 62, "zoo": 65, "\u898b\u7fd2\u3044": 55}, "titles": ["404 - Page Not Found", "Minari documentation", "DataCollector", "EpisodeBuffer", "EpisodeMetadataCallback", "StepDataCallback", "EpisodeData", "MinariDataset", "MinariStorage", "StepData", "Minari", "Namespace", "Basic Usage", "Dataset Standards", "Minari CLI", "Ant Maze", "Large-Diverse", "Large-Play", "Medium-Diverse", "Medium-Play", "Umaze-Diverse", "Umaze", "Cloned", "Expert", "Human", "Door", "Cloned", "Expert", "Human", "Hammer", "D4RL", "Complete", "Kitchen", "Mixed", "Partial", "Fourrooms-Random", "Fourrooms", "MiniGrid", "Cloned", "Expert", "Human", "Pen", "Point Maze", "Large-Dense", "Large", "Medium-Dense", "Medium", "Open-Dense", "Open", "Umaze-Dense", "Umaze", "Cloned", "Expert", "Human", "Relocate", "<no title>", "Release Notes", "Dataset Creation", "Serializing a custom space", "Dataset Creation", "Collecting a subset of a dictionary space with StepDataCallback", "PointMaze D4RL dataset", "Tutorials", "Implicit Q-Learning with TorchRL", "Using Datasets", "Behavioral cloning with PyTorch", "Using Datasets"], "titleterms": {"0": 56, "1": [56, 61], "2": [56, 61], "3": [56, 61], "4": 56, "404": 0, "5": 56, "For": 63, "Not": 0, "The": [0, 63], "action": 13, "adroit": 63, "ant": 15, "attribut": [3, 6, 7, 8, 9], "basic": 12, "behavior": 65, "buffer": 63, "build": [1, 63], "checkpoint": 12, "cli": 14, "clone": [22, 26, 38, 51, 65], "collect": [12, 60, 61], "combin": [10, 12, 14], "complet": 31, "content": [15, 25, 29, 30, 32, 37, 41, 42, 54], "control": 61, "could": 0, "creat": [10, 11, 12, 61], "creation": [57, 59, 62], "custom": 58, "d": 61, "d4rl": [30, 61], "data": [12, 61], "data_collector": 3, "datacollector": 2, "dataset": [8, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 57, 59, 61, 62, 64, 65, 66], "defin": 63, "delet": [10, 11, 14], "dens": [43, 45, 47, 49], "deriv": 61, "descript": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "detail": 14, "dictionari": 60, "directori": 13, "divers": [16, 18, 20], "document": 1, "door": 25, "download": [10, 11, 12, 14], "environ": [12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 63], "episod": 12, "episodebuff": 3, "episodedata": [6, 13], "episodemetadatacallback": 4, "evalu": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "expert": [23, 27, 39, 52], "filter": 12, "found": 0, "fourroom": [35, 36], "gener": 65, "get": 11, "hammer": 29, "headless": 63, "human": [24, 28, 40, 53], "i": 61, "implicit": 63, "import": 65, "instal": 12, "integr": 61, "kitchen": 32, "larg": [16, 17, 43, 44], "learn": 63, "list": [10, 11, 14], "load": [10, 12], "local": [11, 12, 14], "loss": 63, "maze": [15, 42], "medium": [18, 19, 45, 46], "metadata": [11, 13], "method": [2, 3, 4, 5, 7, 8], "minari": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 61], "minari_storag": 8, "minaridataset": 7, "minaristorag": 8, "minigrid": 37, "mix": 33, "model": 63, "modifi": 61, "namespac": [11, 12, 13], "normal": 10, "note": 56, "observ": 13, "open": [47, 48], "optim": 63, "p": 61, "page": 0, "partial": 34, "pen": [41, 63], "plai": [17, 19], "planner": 61, "point": 42, "pointmaz": 61, "polici": 65, "pre": 63, "proport": 61, "pytorch": 65, "q": 63, "random": 35, "recov": 12, "refer": [15, 25, 29, 32, 37, 41, 42, 54, 61], "releas": 56, "reloc": 54, "replai": 63, "request": 0, "requisit": 63, "result": 63, "sampl": 12, "save": 12, "score": 10, "serial": 58, "show": 14, "space": [13, 58, 60], "spec": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "split": [10, 12], "standard": 13, "stepdata": 9, "stepdatacallback": [5, 60, 61], "structur": 13, "subset": 60, "support": 13, "term": 61, "torchrl": 63, "train": [63, 65], "tutori": 62, "umaz": [20, 21, 49, 50], "updat": 11, "upload": [11, 14], "us": [12, 62, 64, 66], "usag": 12, "v0": 56, "waypoint": 61}}) \ No newline at end of file