From 55447c3466163ae4e28cc8eddde49d9a989f60b2 Mon Sep 17 00:00:00 2001 From: jjshoots <38184875+jjshoots@users.noreply.github.com> Date: Tue, 2 Jul 2024 07:03:10 +0000 Subject: [PATCH] =?UTF-8?q?Deploying=20to=20gh-pages=20from=20@=20Farama-F?= =?UTF-8?q?oundation/PettingZoo@4d75d86d39e4b8f01d224d3875896087d1aae217?= =?UTF-8?q?=20=F0=9F=9A=80?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- main/.buildinfo | 2 +- main/environments/third_party_envs/index.html | 14 ++++++++++++++ main/searchindex.js | 2 +- 3 files changed, 16 insertions(+), 2 deletions(-) diff --git a/main/.buildinfo b/main/.buildinfo index d3b88fb03..363d02e42 100644 --- a/main/.buildinfo +++ b/main/.buildinfo @@ -1,4 +1,4 @@ # Sphinx build info version 1 # This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. -config: 67c8b61a8db4108a85565801bb598878 +config: 6ec1f81676ded56e0d75e900a4e17e0a tags: d77d1c0d9ca2f4c8421862c7c5a0d620 diff --git a/main/environments/third_party_envs/index.html b/main/environments/third_party_envs/index.html index 74201c3c0..e47712f50 100644 --- a/main/environments/third_party_envs/index.html +++ b/main/environments/third_party_envs/index.html @@ -405,6 +405,18 @@

Third-Party Environments

Environments using the latest versions of PettingZoo

Due to a very recent major release of PettingZoo, there are currently few contributed third-party environments. If you’d like to contribute one, please reach out on Discord.

+
+

gfootball-gymnasium-pettingzoo

+

PettingZoo version dependency +GitHub stars

+

Google Research Football (GRF) with Gymnasium and PettingZoo Compatibility.

+
+
+

SMAC and SMACv2 with latest PettingZoo APIs

+

PettingZoo version dependency +GitHub stars

+

SMAC and SMACv2 with the latest PettingZoo Parallel APIs.

+

Sumo-RL

PettingZoo version dependency @@ -649,6 +661,8 @@

Mu
  • Third-Party Environments
    • Environments using the latest versions of PettingZoo
        +
      • gfootball-gymnasium-pettingzoo
      • +
      • SMAC and SMACv2 with latest PettingZoo APIs
      • Sumo-RL
      • POGEMA
      • Racecar Gym
      • diff --git a/main/searchindex.js b/main/searchindex.js index 5cd69f5a3..ab9d69f70 100644 --- a/main/searchindex.js +++ b/main/searchindex.js @@ -1 +1 @@ -Search.setIndex({"alltitles": {"0.18.1: 1.18.1": [[70, "release-0-18-1"]], "1.10.0": [[70, "release-1-10-0"]], "1.11.0": [[70, "release-1-11-0"]], "1.11.1": [[70, "release-1-11-1"]], "1.12.0": [[70, "release-1-12-0"]], "1.13.1": [[70, "release-1-13-1"]], "1.14.0": [[70, "release-1-14-0"]], "1.15.0": [[70, "release-1-15-0"]], "1.16.0": [[70, "release-1-16-0"]], "1.17.0": [[70, "release-1-17-0"]], "1.19.0": [[70, "release-1-19-0"]], "1.19.1": [[70, "release-1-19-1"]], "1.20.0": [[70, "release-1-20-0"]], "1.20.1": [[70, "release-1-20-1"]], "1.21.0": [[70, "release-1-21-0"]], "1.22.0": [[70, "release-1-22-0"]], "1.22.1": [[70, "release-1-22-1"]], "1.22.2": [[70, "release-1-22-2"]], "1.22.3": [[70, "release-1-22-3"]], "1.22.4": [[70, "release-1-22-4"]], "1.4.0": [[70, "release-1-4-0"]], "1.4.2": [[70, "release-1-4-2"]], "1.5.0": [[70, "release-1-5-0"]], "1.5.1": [[70, "release-1-5-1"]], "1.5.2": [[70, "release-1-5-2"]], "1.6.0": [[70, "release-1-6-0"]], "1.6.1": [[70, "release-1-6-1"]], "1.7.0": [[70, "release-1-7-0"]], "1.8.0": [[70, "release-1-8-0"]], "1.8.1": [[70, "release-1-8-1"]], "1.8.2": [[70, "release-1-8-2"]], "1.9.0": [[70, "release-1-9-0"]], "404 - Page Not Found": [[0, "page-not-found"]], "AEC": [[14, "aec"], [15, "aec"], [16, "aec"], [17, "aec"], [18, "aec"], [19, "aec"], [20, "aec"], [21, "aec"], [22, "aec"], [23, "aec"], [24, "aec"], [25, "aec"], [26, "aec"], [27, "aec"], [28, "aec"], [29, "aec"], [30, "aec"], [31, "aec"], [32, "aec"], [33, "aec"], [34, "aec"], [35, "aec"], [36, "aec"], [37, "aec"], [39, "aec"], [40, "aec"], [41, "aec"], [43, "aec"], [44, "aec"], [45, "aec"], [46, "aec"], [47, "aec"], [48, "aec"], [49, "aec"], [50, "aec"], [51, "aec"], [52, "aec"], [55, "aec"], [56, "aec"], [57, "aec"], [58, "aec"], [59, "aec"], [60, "aec"], [61, "aec"], [62, "aec"], [63, "aec"], [65, "aec"], [66, "aec"], [67, "aec"]], "AEC API": [[2, "aec-api"]], "AEC to Parallel": [[6, "module-pettingzoo.utils.conversions"]], "AECEnv": [[2, "aecenv"]], "API": [[14, "api"], [15, "api"], [16, "api"], [17, "api"], [18, "api"], [19, "api"], [20, "api"], [21, "api"], [22, "api"], [23, "api"], [24, "api"], [25, "api"], [26, "api"], [27, "api"], [28, "api"], [29, "api"], [30, "api"], [31, "api"], [32, "api"], [33, "api"], [34, "api"], [35, "api"], [36, "api"], [37, "api"], [39, "api"], [40, "api"], [41, "api"], [43, "api"], [44, "api"], [45, "api"], [46, "api"], [47, "api"], [48, "api"], [49, "api"], [50, "api"], [51, "api"], [52, "api"], [55, "api"], [56, "api"], [57, "api"], [58, "api"], [59, "api"], [60, "api"], [61, "api"], [62, "api"], [63, "api"], [65, "api"], [66, "api"], [67, "api"]], "API Test": [[11, "api-test"]], "About AEC": [[2, "about-aec"]], "Action Masking": [[2, "action-masking"]], "Action Masking Agent": [[86, "action-masking-agent"]], "Action Space": [[15, "action-space"], [16, "action-space"], [17, "action-space"], [18, "action-space"], [19, "action-space"], [20, "action-space"], [23, "action-space"], [24, "action-space"], [25, "action-space"], [26, "action-space"], [31, "action-space"], [33, "action-space"], [37, "action-space"], [43, "action-space"], [44, "action-space"], [45, "action-space"], [46, "action-space"], [47, "action-space"], [48, "action-space"], [49, "action-space"], [50, "action-space"], [51, "action-space"], [52, "action-space"], [54, "action-space"], [67, "action-space"]], "Action Space (Minimal)": [[14, "action-space-minimal"], [21, "action-space-minimal"], [22, "action-space-minimal"], [27, "action-space-minimal"], [28, "action-space-minimal"], [29, "action-space-minimal"], [30, "action-space-minimal"], [32, "action-space-minimal"], [34, "action-space-minimal"], [35, "action-space-minimal"], [36, "action-space-minimal"]], "Additional Environment API": [[9, "additional-environment-api"]], "Advanced: Additional (optional) files": [[78, "advanced-additional-optional-files"]], "Agent Selector": [[4, "agent-selector"]], "Agent selector": [[10, "agent-selector"]], "AgileRL Overview": [[74, "agilerl-overview"]], "AgileRL Tutorial": [[74, "agilerl-tutorial"]], "AgileRL: Implementing DQN - Curriculum Learning and Self-play": [[71, "agilerl-implementing-dqn-curriculum-learning-and-self-play"]], "AgileRL: Implementing MADDPG": [[72, "agilerl-implementing-maddpg"]], "AgileRL: Implementing MATD3": [[73, "agilerl-implementing-matd3"]], "Architecture": [[88, "architecture"], [96, "architecture"]], "Arguments": [[39, "arguments"], [40, "arguments"], [41, "arguments"], [45, "arguments"], [46, "arguments"], [49, "arguments"], [50, "arguments"], [51, "arguments"], [55, "arguments"], [56, "arguments"], [57, "arguments"], [58, "arguments"], [59, "arguments"], [60, "arguments"], [61, "arguments"], [62, "arguments"], [63, "arguments"], [65, "arguments"], [66, "arguments"], [67, "arguments"]], "Atari": [[13, "atari"]], "Attributes": [[2, "attributes"]], "Average Total Reward": [[4, "module-pettingzoo.utils.average_total_reward"]], "Basic Usage": [[9, "basic-usage"]], "Basketball Pong": [[14, "basketball-pong"]], "BomberManAI": [[68, "bombermanai"]], "Boxing": [[15, "boxing"]], "Breakout-Clone": [[68, "breakout-clone"]], "Build the Documentation": [[1, "build-the-documentation"]], "Butterfly": [[38, "butterfly"]], "Can I use it?": [[71, "can-i-use-it"], [72, "can-i-use-it"], [73, "can-i-use-it"]], "Capture Stdout": [[4, "capture-stdout"]], "Carla Gym": [[68, "carla-gym"]], "Cathedral-RL": [[68, "cathedral-rl"]], "Checking if the entire environment is done": [[9, "checking-if-the-entire-environment-is-done"]], "Chess": [[43, "chess"]], "Citation": [[7, "citation"], [8, "citation"], [13, "citation"], [54, "citation"]], "Classic": [[42, "classic"]], "CleanRL Overview": [[77, "cleanrl-overview"]], "CleanRL Tutorial": [[77, "cleanrl-tutorial"]], "CleanRL: Advanced PPO": [[75, "cleanrl-advanced-ppo"]], "CleanRL: Implementing PPO": [[76, "cleanrl-implementing-ppo"]], "Code": [[71, "code"], [72, "code"], [73, "code"], [75, "code"], [76, "code"], [79, "code"], [80, "code"], [81, "code"], [87, "code"], [89, "code"], [90, "code"], [92, "code"], [93, "code"], [94, "code"], [95, "code"], [97, "code"]], "Combat: Plane": [[16, "combat-plane"]], "Combat: Tank": [[17, "combat-tank"]], "Common Parameters": [[13, "common-parameters"]], "Config files": [[71, "config-files"]], "Connect Four": [[44, "connect-four"]], "Conversion wrappers": [[6, "conversion-wrappers"]], "CookingZoo": [[68, "cookingzoo"]], "Cooperative Pong": [[39, "cooperative-pong"]], "Crazy-RL": [[68, "crazy-rl"]], "Curriculum Learning": [[71, "curriculum-learning"]], "Curriculum learning and self-play using DQN on Connect Four": [[71, "curriculum-learning-and-self-play-using-dqn-on-connect-four"]], "Custom Environment Tutorial": [[83, "custom-environment-tutorial"]], "Cyber Operations Research Gym": [[68, "cyber-operations-research-gym"]], "DSSE: Drone Swarm Search Environment": [[68, "dsse-drone-swarm-search-environment"]], "DeepMind Control Soccer": [[7, "deepmind-control-soccer"]], "DeepMind Melting Pot": [[7, "deepmind-melting-pot"]], "Deprecated Module": [[10, "deprecated-module"]], "Developer Utils": [[10, "developer-utils"]], "Double Dunk": [[18, "double-dunk"]], "Editing an environment page": [[1, "editing-an-environment-page"]], "Emtombed: Competitive": [[19, "emtombed-competitive"]], "Emtombed: Cooperative": [[20, "emtombed-cooperative"]], "EnvLogger": [[4, "envlogger"]], "Environment Creation": [[10, "environment-creation"]], "Environment Details": [[13, "environment-details"]], "Environment Loop": [[86, "environment-loop"]], "Environment Setup": [[71, "environment-setup"], [72, "environment-setup"], [73, "environment-setup"], [75, "environment-setup"], [76, "environment-setup"], [86, "environment-setup"], [87, "environment-setup"], [89, "environment-setup"], [90, "environment-setup"], [92, "environment-setup"], [93, "environment-setup"], [94, "environment-setup"], [95, "environment-setup"], [97, "environment-setup"]], "Environment arguments": [[47, "environment-arguments"]], "Environment as an Agent": [[9, "environment-as-an-agent"]], "Environment parameters": [[14, "environment-parameters"], [15, "environment-parameters"], [16, "environment-parameters"], [17, "environment-parameters"], [18, "environment-parameters"], [19, "environment-parameters"], [20, "environment-parameters"], [21, "environment-parameters"], [22, "environment-parameters"], [23, "environment-parameters"], [24, "environment-parameters"], [25, "environment-parameters"], [26, "environment-parameters"], [27, "environment-parameters"], [28, "environment-parameters"], [29, "environment-parameters"], [30, "environment-parameters"], [31, "environment-parameters"], [32, "environment-parameters"], [33, "environment-parameters"], [34, "environment-parameters"], [35, "environment-parameters"], [36, "environment-parameters"], [37, "environment-parameters"]], "Environments using older versions of PettingZoo": [[68, "environments-using-older-versions-of-pettingzoo"]], "Environments using the latest versions of PettingZoo": [[68, "environments-using-the-latest-versions-of-pettingzoo"]], "Environments:": [[88, "environments"]], "Example Custom Environment": [[10, "example-custom-environment"]], "Example Custom Parallel Environment": [[10, "example-custom-parallel-environment"]], "Examples": [[2, "examples"], [3, "examples"]], "Examples using PettingZoo": [[74, "examples-using-pettingzoo"], [96, "examples-using-pettingzoo"]], "Examples using PettingZoo:": [[77, "examples-using-pettingzoo"], [88, "examples-using-pettingzoo"]], "Expanded Game": [[49, "expanded-game"], [49, "id3"]], "Fanorona AEC": [[68, "fanorona-aec"]], "Flag Capture": [[21, "flag-capture"]], "Foozpong": [[22, "foozpong"]], "Full Code": [[86, "full-code"]], "Full training code": [[71, "full-training-code"]], "Galaga AI": [[68, "galaga-ai"]], "Games Overview": [[13, "games-overview"]], "General setup": [[71, "general-setup"]], "Gin Rummy": [[45, "gin-rummy"]], "Go": [[46, "go"]], "Gobblet-RL": [[68, "gobblet-rl"]], "Gymnasium Agent": [[86, "gymnasium-agent"]], "Hanabi": [[47, "hanabi"]], "Ice Hockey": [[23, "ice-hockey"]], "Image-based": [[40, "image-based"]], "Imports": [[71, "imports"]], "Included Functions": [[8, "included-functions"]], "Included Multi-Agent Only Functions": [[8, "included-multi-agent-only-functions"]], "Initializing Environments": [[9, "initializing-environments"]], "Installation": [[9, "installation"], [13, "installation"], [38, "installation"], [42, "installation"], [54, "installation"], [64, "installation"]], "Interacting With Environments": [[9, "interacting-with-environments"]], "Interactive Connect Four": [[68, "interactive-connect-four"]], "Introduction": [[78, "introduction"], [79, "introduction"], [80, "introduction"], [81, "introduction"]], "Joust": [[24, "joust"]], "Kaggle Environments": [[68, "kaggle-environments"]], "Key Concepts": [[54, "key-concepts"]], "Knights Archers Zombies (\u2018KAZ\u2019)": [[40, "knights-archers-zombies-kaz"]], "LangChain Overview": [[85, "langchain-overview"]], "LangChain Tutorial": [[85, "langchain-tutorial"]], "LangChain: Creating LLM agents": [[86, "langchain-creating-llm-agents"]], "Leduc Hold\u2019em": [[48, "leduc-hold-em"]], "Legal Actions Mask": [[43, "legal-actions-mask"], [44, "legal-actions-mask"], [45, "legal-actions-mask"], [46, "legal-actions-mask"], [47, "legal-actions-mask"], [48, "legal-actions-mask"], [50, "legal-actions-mask"], [51, "legal-actions-mask"], [52, "legal-actions-mask"]], "MATS Gym": [[68, "mats-gym"]], "MPE": [[54, "mpe"]], "Manual Control": [[39, "manual-control"], [40, "manual-control"], [66, "manual-control"]], "Mario Bros": [[25, "mario-bros"]], "Max Cycles Test": [[11, "max-cycles-test"]], "Maze Craze": [[26, "maze-craze"]], "Methods": [[2, "methods"]], "Mu Torere": [[68, "mu-torere"]], "Multi-Agent Compatibility Wrappers:": [[7, "multi-agent-compatibility-wrappers"]], "Multiwalker": [[65, "multiwalker"]], "Neural MMO": [[68, "neural-mmo"]], "Notable Idioms": [[9, "notable-idioms"]], "Observation Saving": [[4, "module-pettingzoo.utils.save_observation"]], "Observation Space": [[43, "observation-space"], [44, "observation-space"], [45, "observation-space"], [46, "observation-space"], [47, "observation-space"], [48, "observation-space"], [49, "observation-space"], [50, "observation-space"], [51, "observation-space"], [52, "observation-space"], [54, "observation-space"], [65, "observation-space"], [67, "observation-space"]], "OpenSpiel": [[7, "openspiel"]], "Optional API Components": [[9, "optional-api-components"]], "Othello": [[27, "othello"]], "POGEMA": [[68, "pogema"]], "Parallel": [[14, "parallel"], [15, "parallel"], [16, "parallel"], [17, "parallel"], [18, "parallel"], [19, "parallel"], [20, "parallel"], [21, "parallel"], [22, "parallel"], [23, "parallel"], [24, "parallel"], [25, "parallel"], [26, "parallel"], [27, "parallel"], [28, "parallel"], [29, "parallel"], [30, "parallel"], [31, "parallel"], [32, "parallel"], [33, "parallel"], [34, "parallel"], [35, "parallel"], [36, "parallel"], [37, "parallel"], [39, "parallel"], [40, "parallel"], [41, "parallel"], [49, "parallel"], [55, "parallel"], [56, "parallel"], [57, "parallel"], [58, "parallel"], [59, "parallel"], [60, "parallel"], [61, "parallel"], [62, "parallel"], [63, "parallel"], [65, "parallel"], [66, "parallel"], [67, "parallel"]], "Parallel API": [[3, "parallel-api"]], "Parallel API Test": [[11, "parallel-api-test"]], "Parallel to AEC": [[6, "module-pettingzoo.utils.conversions"]], "ParallelEnv": [[3, "parallelenv"]], "Performance Benchmark Test": [[11, "performance-benchmark-test"]], "PettingZoo 1.23.0": [[70, "release-1-23-0"]], "PettingZoo 1.23.1": [[70, "release-1-23-1"]], "PettingZoo 1.24.0": [[70, "release-1-24-0"]], "PettingZoo 1.24.1": [[70, "release-1-24-1"]], "PettingZoo 1.24.2": [[70, "release-1-24-2"]], "PettingZoo 1.24.3": [[70, "release-1-24-3"]], "PettingZoo Agent": [[86, "pettingzoo-agent"]], "PettingZoo Dilemma Envs": [[68, "pettingzoo-dilemma-envs"]], "PettingZoo Wrappers": [[6, "pettingzoo-wrappers"]], "PettingZoo docs": [[1, "pettingzoo-docs"]], "Pistonball": [[41, "pistonball"]], "Pong": [[28, "pong"]], "Preprocessing": [[13, "preprocessing"]], "Pursuit": [[66, "pursuit"]], "Quadrapong": [[29, "quadrapong"]], "RLlib Overview": [[88, "rllib-overview"]], "RLlib: DQN for Simple Poker": [[87, "rllib-dqn-for-simple-poker"]], "RLlib: PPO for Pistonball": [[89, "rllib-ppo-for-pistonball"]], "Racecar Gym": [[68, "racecar-gym"]], "Raw Environments": [[9, "raw-environments"]], "Ray RLlib Tutorial": [[88, "ray-rllib-tutorial"]], "Recommended start": [[12, "recommended-start"]], "Release Notes": [[70, "release-notes"]], "Render Test": [[11, "render-test"]], "Rendering": [[54, "rendering"]], "Rewards": [[43, "rewards"], [44, "rewards"], [45, "rewards"], [46, "rewards"], [47, "rewards"], [48, "rewards"], [49, "rewards"], [50, "rewards"], [51, "rewards"], [52, "rewards"], [67, "rewards"]], "Rock Paper Scissors": [[49, "rock-paper-scissors"]], "Rock, Paper, Scissors": [[49, "id1"], [49, "id2"]], "Rock-Paper-Scissors": [[86, "rock-paper-scissors"]], "SB3: Action Masked PPO for Connect Four": [[90, "sb3-action-masked-ppo-for-connect-four"]], "SB3: PPO for Knights-Archers-Zombies": [[92, "sb3-ppo-for-knights-archers-zombies"]], "SB3: PPO for Waterworld": [[93, "sb3-ppo-for-waterworld"]], "SISL": [[64, "sisl"]], "Save Observation Test": [[11, "save-observation-test"]], "Seed Test": [[11, "seed-test"]], "Self-play": [[71, "self-play"]], "Sequential Social Dilemma Games": [[68, "sequential-social-dilemma-games"]], "Shimmy Compatibility Wrappers": [[7, "shimmy-compatibility-wrappers"]], "Simple": [[55, "simple"]], "Simple Adversary": [[56, "simple-adversary"]], "Simple Crypto": [[57, "simple-crypto"]], "Simple Push": [[58, "simple-push"]], "Simple Reference": [[59, "simple-reference"]], "Simple Speaker Listener": [[60, "simple-speaker-listener"]], "Simple Spread": [[61, "simple-spread"]], "Simple Tag": [[62, "simple-tag"]], "Simple World Comm": [[63, "simple-world-comm"]], "Skeleton code": [[78, "skeleton-code"]], "Space Invaders": [[30, "space-invaders"]], "Space War": [[31, "space-war"]], "Stable-Baselines Overview": [[91, "stable-baselines-overview"]], "Stable-Baselines3 Tutorial": [[91, "stable-baselines3-tutorial"]], "Stone Ground Hearth Battles": [[68, "stone-ground-hearth-battles"]], "Sumo-RL": [[68, "sumo-rl"]], "Supersuit Wrappers": [[8, "supersuit-wrappers"]], "Supported multi-agent environments:": [[7, "supported-multi-agent-environments"]], "Surround": [[32, "surround"]], "Teamfight Tactics MuZero Agent": [[68, "teamfight-tactics-muzero-agent"]], "Tennis": [[33, "tennis"]], "Termination": [[54, "termination"]], "Test the documentation": [[1, "test-the-documentation"]], "Testing Environments": [[11, "testing-environments"]], "Testing other PettingZoo Classic environments": [[90, "testing-other-pettingzoo-classic-environments"]], "Texas Holdem\u2019 No Limit": [[86, "texas-holdem-no-limit"]], "Texas Hold\u2019em": [[50, "texas-hold-em"]], "Texas Hold\u2019em No Limit": [[51, "texas-hold-em-no-limit"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Third-Party Environments": [[68, "third-party-environments"]], "Tianshou Overview": [[96, "tianshou-overview"]], "Tianshou Tutorial": [[96, "tianshou-tutorial"]], "Tianshou: Basic API Usage": [[95, "tianshou-basic-api-usage"]], "Tianshou: CLI and Logging": [[94, "tianshou-cli-and-logging"]], "Tianshou: Training Agents": [[97, "tianshou-training-agents"]], "Tic Tac Toe": [[52, "tic-tac-toe"]], "Tic-Tac-Toe": [[86, "tic-tac-toe"]], "Train multiple agents using MADDPG": [[72, "train-multiple-agents-using-maddpg"], [73, "train-multiple-agents-using-maddpg"]], "Trained model weights": [[71, "trained-model-weights"]], "Training and Evaluation": [[90, "training-and-evaluation"], [92, "training-and-evaluation"], [93, "training-and-evaluation"]], "Training loop": [[71, "training-loop"]], "Training the RL agent": [[87, "training-the-rl-agent"], [89, "training-the-rl-agent"]], "Training:": [[88, "training"]], "Tree structure": [[78, "tree-structure"]], "Tutorial: Action Masking": [[80, "tutorial-action-masking"]], "Tutorial: Environment Logic": [[79, "tutorial-environment-logic"]], "Tutorial: Repository Structure": [[78, "tutorial-repository-structure"]], "Tutorial: Testing Your Environment": [[81, "tutorial-testing-your-environment"]], "Tutorials": [[12, "tutorials"]], "Types of Environments": [[54, "types-of-environments"]], "Unwrapping an environment": [[9, "unwrapping-an-environment"]], "Usage": [[2, "usage"], [3, "usage"], [7, "usage"], [13, "usage"], [14, "usage"], [15, "usage"], [16, "usage"], [17, "usage"], [18, "usage"], [19, "usage"], [20, "usage"], [21, "usage"], [22, "usage"], [23, "usage"], [24, "usage"], [25, "usage"], [26, "usage"], [27, "usage"], [28, "usage"], [29, "usage"], [30, "usage"], [31, "usage"], [32, "usage"], [33, "usage"], [34, "usage"], [35, "usage"], [36, "usage"], [37, "usage"], [38, "usage"], [39, "usage"], [40, "usage"], [41, "usage"], [42, "usage"], [43, "usage"], [44, "usage"], [45, "usage"], [46, "usage"], [47, "usage"], [48, "usage"], [49, "usage"], [50, "usage"], [51, "usage"], [52, "usage"], [54, "usage"], [55, "usage"], [56, "usage"], [57, "usage"], [58, "usage"], [59, "usage"], [60, "usage"], [61, "usage"], [62, "usage"], [63, "usage"], [64, "usage"], [65, "usage"], [66, "usage"], [67, "usage"]], "Using Wrappers": [[5, "using-wrappers"], [10, "using-wrappers"]], "Utility Wrappers": [[6, "utility-wrappers"]], "Utils": [[4, "utils"]], "Variable Numbers of Agents (Death)": [[9, "variable-numbers-of-agents-death"]], "Vectorized (Default)": [[40, "vectorized-default"]], "Version History": [[14, "version-history"], [15, "version-history"], [16, "version-history"], [17, "version-history"], [18, "version-history"], [19, "version-history"], [20, "version-history"], [21, "version-history"], [22, "version-history"], [23, "version-history"], [24, "version-history"], [25, "version-history"], [26, "version-history"], [27, "version-history"], [28, "version-history"], [29, "version-history"], [30, "version-history"], [31, "version-history"], [32, "version-history"], [33, "version-history"], [34, "version-history"], [35, "version-history"], [36, "version-history"], [37, "version-history"], [39, "version-history"], [40, "version-history"], [41, "version-history"], [43, "version-history"], [44, "version-history"], [45, "version-history"], [46, "version-history"], [47, "version-history"], [48, "version-history"], [49, "version-history"], [50, "version-history"], [51, "version-history"], [52, "version-history"], [65, "version-history"], [66, "version-history"]], "Video Checkers": [[34, "video-checkers"]], "Volleyball Pong": [[35, "volleyball-pong"]], "WandB Integration": [[77, "wandb-integration"]], "Warlords": [[36, "warlords"]], "Watch the trained agents play": [[71, "watch-the-trained-agents-play"], [72, "watch-the-trained-agents-play"], [73, "watch-the-trained-agents-play"]], "Watching the trained RL agent play": [[87, "watching-the-trained-rl-agent-play"], [89, "watching-the-trained-rl-agent-play"]], "Waterworld": [[67, "waterworld"]], "What is DQN?": [[71, "what-is-dqn"]], "What is MADDPG?": [[72, "what-is-maddpg"]], "What is MATD3?": [[73, "what-is-matd3"]], "Wizard of Wor": [[37, "wizard-of-wor"]], "Wrappers": [[5, "wrappers"]], "cogment-verse": [[68, "cogment-verse"]], "conflict_rez": [[68, "conflict-rez"]], "pz-battlesnake": [[68, "pz-battlesnake"]], "skyjo_rl": [[68, "skyjo-rl"]], "\ud83d\udcc3 LLMs and Prompts:": [[85, "llms-and-prompts"]], "\ud83d\udcda Data Augmented Generation:": [[85, "data-augmented-generation"]], "\ud83d\udd17 Chains:": [[85, "chains"]], "\ud83e\udd16 Agents:": [[85, "agents"]], "\ud83e\uddd0 Evaluation:": [[85, "evaluation"]], "\ud83e\udde0 Memory:": [[85, "memory"]]}, "docnames": ["404", "README", "api/aec", "api/parallel", "api/utils", "api/wrappers", "api/wrappers/pz_wrappers", "api/wrappers/shimmy_wrappers", "api/wrappers/supersuit_wrappers", "content/basic_usage", "content/environment_creation", "content/environment_tests", "content/tutorials", "environments/atari", "environments/atari/basketball_pong", "environments/atari/boxing", "environments/atari/combat_plane", "environments/atari/combat_tank", "environments/atari/double_dunk", "environments/atari/entombed_competitive", "environments/atari/entombed_cooperative", "environments/atari/flag_capture", "environments/atari/foozpong", "environments/atari/ice_hockey", "environments/atari/joust", "environments/atari/mario_bros", "environments/atari/maze_craze", "environments/atari/othello", "environments/atari/pong", "environments/atari/quadrapong", "environments/atari/space_invaders", "environments/atari/space_war", "environments/atari/surround", "environments/atari/tennis", "environments/atari/video_checkers", "environments/atari/volleyball_pong", "environments/atari/warlords", "environments/atari/wizard_of_wor", "environments/butterfly", "environments/butterfly/cooperative_pong", "environments/butterfly/knights_archers_zombies", "environments/butterfly/pistonball", "environments/classic", "environments/classic/chess", "environments/classic/connect_four", "environments/classic/gin_rummy", "environments/classic/go", "environments/classic/hanabi", "environments/classic/leduc_holdem", "environments/classic/rps", "environments/classic/texas_holdem", "environments/classic/texas_holdem_no_limit", "environments/classic/tictactoe", "environments/envs", "environments/mpe", "environments/mpe/simple", "environments/mpe/simple_adversary", "environments/mpe/simple_crypto", "environments/mpe/simple_push", "environments/mpe/simple_reference", "environments/mpe/simple_speaker_listener", "environments/mpe/simple_spread", "environments/mpe/simple_tag", "environments/mpe/simple_world_comm", "environments/sisl", "environments/sisl/multiwalker", "environments/sisl/pursuit", "environments/sisl/waterworld", "environments/third_party_envs", "index", "release_notes/index", "tutorials/agilerl/DQN", "tutorials/agilerl/MADDPG", "tutorials/agilerl/MATD3", "tutorials/agilerl/index", "tutorials/cleanrl/advanced_PPO", "tutorials/cleanrl/implementing_PPO", "tutorials/cleanrl/index", "tutorials/custom_environment/1-project-structure", "tutorials/custom_environment/2-environment-logic", "tutorials/custom_environment/3-action-masking", "tutorials/custom_environment/4-testing-your-environment", "tutorials/custom_environment/5-using-your-environment", "tutorials/custom_environment/index", "tutorials/index", "tutorials/langchain/index", "tutorials/langchain/langchain", "tutorials/rllib/holdem", "tutorials/rllib/index", "tutorials/rllib/pistonball", "tutorials/sb3/connect_four", "tutorials/sb3/index", "tutorials/sb3/kaz", "tutorials/sb3/waterworld", "tutorials/tianshou/advanced", "tutorials/tianshou/beginner", "tutorials/tianshou/index", "tutorials/tianshou/intermediate"], "envversion": {"sphinx": 61, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.intersphinx": 1, "sphinx.ext.viewcode": 1}, "filenames": ["404.md", "README.md", "api/aec.md", "api/parallel.md", "api/utils.md", "api/wrappers.md", "api/wrappers/pz_wrappers.md", "api/wrappers/shimmy_wrappers.md", "api/wrappers/supersuit_wrappers.md", "content/basic_usage.md", "content/environment_creation.md", "content/environment_tests.md", "content/tutorials.md", "environments/atari.md", "environments/atari/basketball_pong.md", "environments/atari/boxing.md", "environments/atari/combat_plane.md", "environments/atari/combat_tank.md", "environments/atari/double_dunk.md", "environments/atari/entombed_competitive.md", "environments/atari/entombed_cooperative.md", "environments/atari/flag_capture.md", "environments/atari/foozpong.md", "environments/atari/ice_hockey.md", "environments/atari/joust.md", "environments/atari/mario_bros.md", "environments/atari/maze_craze.md", "environments/atari/othello.md", "environments/atari/pong.md", "environments/atari/quadrapong.md", "environments/atari/space_invaders.md", "environments/atari/space_war.md", "environments/atari/surround.md", "environments/atari/tennis.md", "environments/atari/video_checkers.md", "environments/atari/volleyball_pong.md", "environments/atari/warlords.md", "environments/atari/wizard_of_wor.md", "environments/butterfly.md", "environments/butterfly/cooperative_pong.md", "environments/butterfly/knights_archers_zombies.md", "environments/butterfly/pistonball.md", "environments/classic.md", "environments/classic/chess.md", "environments/classic/connect_four.md", "environments/classic/gin_rummy.md", "environments/classic/go.md", "environments/classic/hanabi.md", "environments/classic/leduc_holdem.md", "environments/classic/rps.md", "environments/classic/texas_holdem.md", "environments/classic/texas_holdem_no_limit.md", "environments/classic/tictactoe.md", "environments/envs.md", "environments/mpe.md", "environments/mpe/simple.md", "environments/mpe/simple_adversary.md", "environments/mpe/simple_crypto.md", "environments/mpe/simple_push.md", "environments/mpe/simple_reference.md", "environments/mpe/simple_speaker_listener.md", "environments/mpe/simple_spread.md", "environments/mpe/simple_tag.md", "environments/mpe/simple_world_comm.md", "environments/sisl.md", "environments/sisl/multiwalker.md", "environments/sisl/pursuit.md", "environments/sisl/waterworld.md", "environments/third_party_envs.md", "index.md", "release_notes/index.md", "tutorials/agilerl/DQN.md", "tutorials/agilerl/MADDPG.md", "tutorials/agilerl/MATD3.md", "tutorials/agilerl/index.md", "tutorials/cleanrl/advanced_PPO.md", "tutorials/cleanrl/implementing_PPO.md", "tutorials/cleanrl/index.md", "tutorials/custom_environment/1-project-structure.md", "tutorials/custom_environment/2-environment-logic.md", "tutorials/custom_environment/3-action-masking.md", "tutorials/custom_environment/4-testing-your-environment.md", "tutorials/custom_environment/5-using-your-environment.md", "tutorials/custom_environment/index.md", "tutorials/index.md", "tutorials/langchain/index.md", "tutorials/langchain/langchain.md", "tutorials/rllib/holdem.md", "tutorials/rllib/index.md", "tutorials/rllib/pistonball.md", "tutorials/sb3/connect_four.md", "tutorials/sb3/index.md", "tutorials/sb3/kaz.md", "tutorials/sb3/waterworld.md", "tutorials/tianshou/advanced.md", "tutorials/tianshou/beginner.md", "tutorials/tianshou/index.md", "tutorials/tianshou/intermediate.md"], "indexentries": {"action_space() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.action_space", false]], "action_space() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.action_space", false]], "action_space() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.action_space", false]], "action_space() (pettingzoo.classic.chess.chess.raw_env method)": [[43, "pettingzoo.classic.chess.chess.raw_env.action_space", false]], "action_space() (pettingzoo.classic.connect_four.connect_four.raw_env method)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env.action_space", false]], "action_space() (pettingzoo.classic.go.go.raw_env method)": [[46, "pettingzoo.classic.go.go.raw_env.action_space", false]], "action_space() (pettingzoo.classic.hanabi.hanabi.raw_env method)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env.action_space", false]], "action_space() (pettingzoo.classic.rps.rps.raw_env method)": [[49, "pettingzoo.classic.rps.rps.raw_env.action_space", false]], "action_space() (pettingzoo.classic.tictactoe.tictactoe.raw_env method)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env.action_space", false]], "action_space() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.action_space", false]], "action_space() (pettingzoo.sisl.pursuit.pursuit.raw_env method)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env.action_space", false]], "action_space() (pettingzoo.sisl.waterworld.waterworld.raw_env method)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env.action_space", false]], "action_space() (pettingzoo.utils.env.parallelenv method)": [[3, "pettingzoo.utils.env.ParallelEnv.action_space", false]], "action_spaces (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.action_spaces", false]], "action_spaces (pettingzoo.utils.env.parallelenv attribute)": [[3, "pettingzoo.utils.env.ParallelEnv.action_spaces", false]], "aec_to_parallel() (in module pettingzoo.utils.conversions)": [[6, "pettingzoo.utils.conversions.aec_to_parallel", false]], "aecenv (class in pettingzoo.utils.env)": [[2, "pettingzoo.utils.env.AECEnv", false]], "agent_indicator_v0()": [[8, "agent_indicator_v0", false]], "agent_selection (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.agent_selection", false]], "agent_selector (class in pettingzoo.utils.agent_selector)": [[4, "pettingzoo.utils.agent_selector.agent_selector", false]], "agents (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.agents", false]], "agents (pettingzoo.utils.env.parallelenv attribute)": [[3, "pettingzoo.utils.env.ParallelEnv.agents", false]], "agentselector (class in pettingzoo.utils.agent_selector)": [[4, "pettingzoo.utils.agent_selector.AgentSelector", false]], "assertoutofboundswrapper (class in pettingzoo.utils.wrappers)": [[6, "pettingzoo.utils.wrappers.AssertOutOfBoundsWrapper", false]], "average_total_reward() (in module pettingzoo.utils.average_total_reward)": [[4, "pettingzoo.utils.average_total_reward.average_total_reward", false]], "basewrapper (class in pettingzoo.utils.wrappers)": [[6, "pettingzoo.utils.wrappers.BaseWrapper", false]], "black_death_v2()": [[8, "black_death_v2", false]], "built-in function": [[8, "agent_indicator_v0", false], [8, "black_death_v2", false], [8, "clip_actions_v0", false], [8, "clip_reward_v0", false], [8, "color_reduction_v0", false], [8, "delay_observations_v0", false], [8, "dtype_v0", false], [8, "flatten_v0", false], [8, "frame_skip_v0", false], [8, "frame_stack_v1", false], [8, "max_observation_v0", false], [8, "nan_noop_v0", false], [8, "nan_random_v0", false], [8, "nan_zeros_v0", false], [8, "normalize_obs_v0", false], [8, "pad_action_space_v0", false], [8, "pad_observations_v0", false], [8, "reshape_v0", false], [8, "resize_v1", false], [8, "scale_actions_v0", false], [8, "sticky_actions_v0", false]], "capture_stdout (class in pettingzoo.utils.capture_stdout)": [[4, "pettingzoo.utils.capture_stdout.capture_stdout", false]], "capturestdoutwrapper (class in pettingzoo.utils.wrappers)": [[6, "pettingzoo.utils.wrappers.CaptureStdoutWrapper", false]], "clip_actions_v0()": [[8, "clip_actions_v0", false]], "clip_reward_v0()": [[8, "clip_reward_v0", false]], "clipoutofboundswrapper (class in pettingzoo.utils.wrappers)": [[6, "pettingzoo.utils.wrappers.ClipOutOfBoundsWrapper", false]], "close() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.close", false]], "close() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.close", false]], "close() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.close", false]], "close() (pettingzoo.classic.chess.chess.raw_env method)": [[43, "pettingzoo.classic.chess.chess.raw_env.close", false]], "close() (pettingzoo.classic.connect_four.connect_four.raw_env method)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env.close", false]], "close() (pettingzoo.classic.go.go.raw_env method)": [[46, "pettingzoo.classic.go.go.raw_env.close", false]], "close() (pettingzoo.classic.hanabi.hanabi.raw_env method)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env.close", false]], "close() (pettingzoo.classic.rps.rps.raw_env method)": [[49, "pettingzoo.classic.rps.rps.raw_env.close", false]], "close() (pettingzoo.classic.tictactoe.tictactoe.raw_env method)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env.close", false]], "close() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.close", false]], "close() (pettingzoo.sisl.pursuit.pursuit.raw_env method)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env.close", false]], "close() (pettingzoo.sisl.waterworld.waterworld.raw_env method)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env.close", false]], "close() (pettingzoo.utils.env.aecenv method)": [[2, "pettingzoo.utils.env.AECEnv.close", false]], "close() (pettingzoo.utils.env.parallelenv method)": [[3, "pettingzoo.utils.env.ParallelEnv.close", false]], "color_reduction_v0()": [[8, "color_reduction_v0", false]], "delay_observations_v0()": [[8, "delay_observations_v0", false]], "dtype_v0()": [[8, "dtype_v0", false]], "env (class in pettingzoo.butterfly.cooperative_pong.cooperative_pong)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.env", false]], "env (class in pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.env", false]], "env (class in pettingzoo.butterfly.pistonball.pistonball)": [[41, "pettingzoo.butterfly.pistonball.pistonball.env", false]], "env (class in pettingzoo.classic.chess.chess)": [[43, "pettingzoo.classic.chess.chess.env", false]], "env (class in pettingzoo.classic.connect_four.connect_four)": [[44, "pettingzoo.classic.connect_four.connect_four.env", false]], "env (class in pettingzoo.classic.go.go)": [[46, "pettingzoo.classic.go.go.env", false]], "env (class in pettingzoo.classic.hanabi.hanabi)": [[47, "pettingzoo.classic.hanabi.hanabi.env", false]], "env (class in pettingzoo.classic.rlcard_envs.gin_rummy)": [[45, "pettingzoo.classic.rlcard_envs.gin_rummy.env", false]], "env (class in pettingzoo.classic.rlcard_envs.leduc_holdem)": [[48, "pettingzoo.classic.rlcard_envs.leduc_holdem.env", false]], "env (class in pettingzoo.classic.rlcard_envs.texas_holdem)": [[50, "pettingzoo.classic.rlcard_envs.texas_holdem.env", false]], "env (class in pettingzoo.classic.rlcard_envs.texas_holdem_no_limit)": [[51, "pettingzoo.classic.rlcard_envs.texas_holdem_no_limit.env", false]], "env (class in pettingzoo.classic.rps.rps)": [[49, "pettingzoo.classic.rps.rps.env", false]], "env (class in pettingzoo.classic.tictactoe.tictactoe)": [[52, "pettingzoo.classic.tictactoe.tictactoe.env", false]], "env (class in pettingzoo.sisl.multiwalker.multiwalker)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.env", false]], "env (class in pettingzoo.sisl.pursuit.pursuit)": [[66, "pettingzoo.sisl.pursuit.pursuit.env", false]], "env (class in pettingzoo.sisl.waterworld.waterworld)": [[67, "pettingzoo.sisl.waterworld.waterworld.env", false]], "envlogger (class in pettingzoo.utils.env_logger)": [[4, "pettingzoo.utils.env_logger.EnvLogger", false]], "error_agent_iter_before_reset() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.error_agent_iter_before_reset", false]], "error_nan_action() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.error_nan_action", false]], "error_observe_before_reset() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.error_observe_before_reset", false]], "error_possible_agents_attribute_missing() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.error_possible_agents_attribute_missing", false]], "error_render_before_reset() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.error_render_before_reset", false]], "error_state_before_reset() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.error_state_before_reset", false]], "error_step_before_reset() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.error_step_before_reset", false]], "flatten_v0()": [[8, "flatten_v0", false]], "flush() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.flush", false]], "frame_skip_v0()": [[8, "frame_skip_v0", false]], "frame_stack_v1()": [[8, "frame_stack_v1", false]], "get_logger() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.get_logger", false]], "infos (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.infos", false]], "is_first() (pettingzoo.utils.agent_selector.agentselector method)": [[4, "pettingzoo.utils.agent_selector.AgentSelector.is_first", false]], "is_last() (pettingzoo.utils.agent_selector.agentselector method)": [[4, "pettingzoo.utils.agent_selector.AgentSelector.is_last", false]], "max_num_agents (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.max_num_agents", false]], "max_num_agents (pettingzoo.utils.env.parallelenv attribute)": [[3, "pettingzoo.utils.env.ParallelEnv.max_num_agents", false]], "max_observation_v0()": [[8, "max_observation_v0", false]], "module": [[4, "module-pettingzoo.utils.agent_selector", false], [4, "module-pettingzoo.utils.average_total_reward", false], [4, "module-pettingzoo.utils.capture_stdout", false], [4, "module-pettingzoo.utils.save_observation", false], [6, "module-pettingzoo.utils.conversions", false]], "mqueue (pettingzoo.utils.env_logger.envlogger attribute)": [[4, "pettingzoo.utils.env_logger.EnvLogger.mqueue", false]], "nan_noop_v0()": [[8, "nan_noop_v0", false]], "nan_random_v0()": [[8, "nan_random_v0", false]], "nan_zeros_v0()": [[8, "nan_zeros_v0", false]], "next() (pettingzoo.utils.agent_selector.agentselector method)": [[4, "pettingzoo.utils.agent_selector.AgentSelector.next", false]], "normalize_obs_v0()": [[8, "normalize_obs_v0", false]], "num_agents (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.num_agents", false]], "num_agents (pettingzoo.utils.env.parallelenv attribute)": [[3, "pettingzoo.utils.env.ParallelEnv.num_agents", false]], "observation_space() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.observation_space", false]], "observation_space() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.observation_space", false]], "observation_space() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.observation_space", false]], "observation_space() (pettingzoo.classic.chess.chess.raw_env method)": [[43, "pettingzoo.classic.chess.chess.raw_env.observation_space", false]], "observation_space() (pettingzoo.classic.connect_four.connect_four.raw_env method)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env.observation_space", false]], "observation_space() (pettingzoo.classic.go.go.raw_env method)": [[46, "pettingzoo.classic.go.go.raw_env.observation_space", false]], "observation_space() (pettingzoo.classic.hanabi.hanabi.raw_env method)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env.observation_space", false]], "observation_space() (pettingzoo.classic.rps.rps.raw_env method)": [[49, "pettingzoo.classic.rps.rps.raw_env.observation_space", false]], "observation_space() (pettingzoo.classic.tictactoe.tictactoe.raw_env method)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env.observation_space", false]], "observation_space() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.observation_space", false]], "observation_space() (pettingzoo.sisl.pursuit.pursuit.raw_env method)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env.observation_space", false]], "observation_space() (pettingzoo.sisl.waterworld.waterworld.raw_env method)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env.observation_space", false]], "observation_space() (pettingzoo.utils.env.parallelenv method)": [[3, "pettingzoo.utils.env.ParallelEnv.observation_space", false]], "observation_spaces (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.observation_spaces", false]], "observation_spaces (pettingzoo.utils.env.parallelenv attribute)": [[3, "pettingzoo.utils.env.ParallelEnv.observation_spaces", false]], "observe() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.observe", false]], "observe() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.observe", false]], "observe() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.observe", false]], "observe() (pettingzoo.classic.chess.chess.raw_env method)": [[43, "pettingzoo.classic.chess.chess.raw_env.observe", false]], "observe() (pettingzoo.classic.connect_four.connect_four.raw_env method)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env.observe", false]], "observe() (pettingzoo.classic.go.go.raw_env method)": [[46, "pettingzoo.classic.go.go.raw_env.observe", false]], "observe() (pettingzoo.classic.hanabi.hanabi.raw_env method)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env.observe", false]], "observe() (pettingzoo.classic.rlcard_envs.gin_rummy.raw_env method)": [[45, "pettingzoo.classic.rlcard_envs.gin_rummy.raw_env.observe", false]], "observe() (pettingzoo.classic.rps.rps.raw_env method)": [[49, "pettingzoo.classic.rps.rps.raw_env.observe", false]], "observe() (pettingzoo.classic.tictactoe.tictactoe.raw_env method)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env.observe", false]], "observe() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.observe", false]], "observe() (pettingzoo.sisl.pursuit.pursuit.raw_env method)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env.observe", false]], "observe() (pettingzoo.sisl.waterworld.waterworld.raw_env method)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env.observe", false]], "observe() (pettingzoo.utils.env.aecenv method)": [[2, "pettingzoo.utils.env.AECEnv.observe", false]], "orderenforcingwrapper (class in pettingzoo.utils.wrappers)": [[6, "pettingzoo.utils.wrappers.OrderEnforcingWrapper", false]], "pad_action_space_v0()": [[8, "pad_action_space_v0", false]], "pad_observations_v0()": [[8, "pad_observations_v0", false]], "parallel_to_aec() (in module pettingzoo.utils.conversions)": [[6, "pettingzoo.utils.conversions.parallel_to_aec", false]], "parallelenv (class in pettingzoo.utils.env)": [[3, "pettingzoo.utils.env.ParallelEnv", false]], "pettingzoo.utils.agent_selector": [[4, "module-pettingzoo.utils.agent_selector", false]], "pettingzoo.utils.average_total_reward": [[4, "module-pettingzoo.utils.average_total_reward", false]], "pettingzoo.utils.capture_stdout": [[4, "module-pettingzoo.utils.capture_stdout", false]], "pettingzoo.utils.conversions": [[6, "module-pettingzoo.utils.conversions", false]], "pettingzoo.utils.save_observation": [[4, "module-pettingzoo.utils.save_observation", false]], "possible_agents (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.possible_agents", false]], "possible_agents (pettingzoo.utils.env.parallelenv attribute)": [[3, "pettingzoo.utils.env.ParallelEnv.possible_agents", false]], "raw_env (class in pettingzoo.atari.basketball_pong.basketball_pong)": [[14, "pettingzoo.atari.basketball_pong.basketball_pong.raw_env", false]], "raw_env (class in pettingzoo.atari.boxing.boxing)": [[15, "pettingzoo.atari.boxing.boxing.raw_env", false]], "raw_env (class in pettingzoo.atari.combat_plane.combat_plane)": [[16, "pettingzoo.atari.combat_plane.combat_plane.raw_env", false]], "raw_env (class in pettingzoo.atari.combat_tank.combat_tank)": [[17, "pettingzoo.atari.combat_tank.combat_tank.raw_env", false]], "raw_env (class in pettingzoo.atari.double_dunk.double_dunk)": [[18, "pettingzoo.atari.double_dunk.double_dunk.raw_env", false]], "raw_env (class in pettingzoo.atari.entombed_competitive.entombed_competitive)": [[19, "pettingzoo.atari.entombed_competitive.entombed_competitive.raw_env", false]], "raw_env (class in pettingzoo.atari.entombed_cooperative.entombed_cooperative)": [[20, "pettingzoo.atari.entombed_cooperative.entombed_cooperative.raw_env", false]], "raw_env (class in pettingzoo.atari.flag_capture.flag_capture)": [[21, "pettingzoo.atari.flag_capture.flag_capture.raw_env", false]], "raw_env (class in pettingzoo.atari.foozpong.foozpong)": [[22, "pettingzoo.atari.foozpong.foozpong.raw_env", false]], "raw_env (class in pettingzoo.atari.ice_hockey.ice_hockey)": [[23, "pettingzoo.atari.ice_hockey.ice_hockey.raw_env", false]], "raw_env (class in pettingzoo.atari.joust.joust)": [[24, "pettingzoo.atari.joust.joust.raw_env", false]], "raw_env (class in pettingzoo.atari.mario_bros.mario_bros)": [[25, "pettingzoo.atari.mario_bros.mario_bros.raw_env", false]], "raw_env (class in pettingzoo.atari.maze_craze.maze_craze)": [[26, "pettingzoo.atari.maze_craze.maze_craze.raw_env", false]], "raw_env (class in pettingzoo.atari.othello.othello)": [[27, "pettingzoo.atari.othello.othello.raw_env", false]], "raw_env (class in pettingzoo.atari.pong.pong)": [[28, "pettingzoo.atari.pong.pong.raw_env", false]], "raw_env (class in pettingzoo.atari.quadrapong.quadrapong)": [[29, "pettingzoo.atari.quadrapong.quadrapong.raw_env", false]], "raw_env (class in pettingzoo.atari.space_invaders.space_invaders)": [[30, "pettingzoo.atari.space_invaders.space_invaders.raw_env", false]], "raw_env (class in pettingzoo.atari.space_war.space_war)": [[31, "pettingzoo.atari.space_war.space_war.raw_env", false]], "raw_env (class in pettingzoo.atari.surround.surround)": [[32, "pettingzoo.atari.surround.surround.raw_env", false]], "raw_env (class in pettingzoo.atari.tennis.tennis)": [[33, "pettingzoo.atari.tennis.tennis.raw_env", false]], "raw_env (class in pettingzoo.atari.video_checkers.video_checkers)": [[34, "pettingzoo.atari.video_checkers.video_checkers.raw_env", false]], "raw_env (class in pettingzoo.atari.volleyball_pong.volleyball_pong)": [[35, "pettingzoo.atari.volleyball_pong.volleyball_pong.raw_env", false]], "raw_env (class in pettingzoo.atari.warlords.warlords)": [[36, "pettingzoo.atari.warlords.warlords.raw_env", false]], "raw_env (class in pettingzoo.atari.wizard_of_wor.wizard_of_wor)": [[37, "pettingzoo.atari.wizard_of_wor.wizard_of_wor.raw_env", false]], "raw_env (class in pettingzoo.butterfly.cooperative_pong.cooperative_pong)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env", false]], "raw_env (class in pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env", false]], "raw_env (class in pettingzoo.butterfly.pistonball.pistonball)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env", false]], "raw_env (class in pettingzoo.classic.chess.chess)": [[43, "pettingzoo.classic.chess.chess.raw_env", false]], "raw_env (class in pettingzoo.classic.connect_four.connect_four)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env", false]], "raw_env (class in pettingzoo.classic.go.go)": [[46, "pettingzoo.classic.go.go.raw_env", false]], "raw_env (class in pettingzoo.classic.hanabi.hanabi)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env", false]], "raw_env (class in pettingzoo.classic.rlcard_envs.gin_rummy)": [[45, "pettingzoo.classic.rlcard_envs.gin_rummy.raw_env", false]], "raw_env (class in pettingzoo.classic.rlcard_envs.leduc_holdem)": [[48, "pettingzoo.classic.rlcard_envs.leduc_holdem.raw_env", false]], "raw_env (class in pettingzoo.classic.rlcard_envs.texas_holdem)": [[50, "pettingzoo.classic.rlcard_envs.texas_holdem.raw_env", false]], "raw_env (class in pettingzoo.classic.rlcard_envs.texas_holdem_no_limit)": [[51, "pettingzoo.classic.rlcard_envs.texas_holdem_no_limit.raw_env", false]], "raw_env (class in pettingzoo.classic.rps.rps)": [[49, "pettingzoo.classic.rps.rps.raw_env", false]], "raw_env (class in pettingzoo.classic.tictactoe.tictactoe)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple.simple)": [[55, "pettingzoo.mpe.simple.simple.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_adversary.simple_adversary)": [[56, "pettingzoo.mpe.simple_adversary.simple_adversary.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_crypto.simple_crypto)": [[57, "pettingzoo.mpe.simple_crypto.simple_crypto.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_push.simple_push)": [[58, "pettingzoo.mpe.simple_push.simple_push.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_reference.simple_reference)": [[59, "pettingzoo.mpe.simple_reference.simple_reference.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_speaker_listener.simple_speaker_listener)": [[60, "pettingzoo.mpe.simple_speaker_listener.simple_speaker_listener.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_spread.simple_spread)": [[61, "pettingzoo.mpe.simple_spread.simple_spread.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_tag.simple_tag)": [[62, "pettingzoo.mpe.simple_tag.simple_tag.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_world_comm.simple_world_comm)": [[63, "pettingzoo.mpe.simple_world_comm.simple_world_comm.raw_env", false]], "raw_env (class in pettingzoo.sisl.multiwalker.multiwalker)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env", false]], "raw_env (class in pettingzoo.sisl.pursuit.pursuit)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env", false]], "raw_env (class in pettingzoo.sisl.waterworld.waterworld)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env", false]], "reinit() (pettingzoo.utils.agent_selector.agentselector method)": [[4, "pettingzoo.utils.agent_selector.AgentSelector.reinit", false]], "render() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.render", false]], "render() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.render", false]], "render() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.render", false]], "render() (pettingzoo.classic.chess.chess.raw_env method)": [[43, "pettingzoo.classic.chess.chess.raw_env.render", false]], "render() (pettingzoo.classic.connect_four.connect_four.raw_env method)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env.render", false]], "render() (pettingzoo.classic.go.go.raw_env method)": [[46, "pettingzoo.classic.go.go.raw_env.render", false]], "render() (pettingzoo.classic.hanabi.hanabi.raw_env method)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env.render", false]], "render() (pettingzoo.classic.rlcard_envs.gin_rummy.raw_env method)": [[45, "pettingzoo.classic.rlcard_envs.gin_rummy.raw_env.render", false]], "render() (pettingzoo.classic.rlcard_envs.leduc_holdem.raw_env method)": [[48, "pettingzoo.classic.rlcard_envs.leduc_holdem.raw_env.render", false]], "render() (pettingzoo.classic.rlcard_envs.texas_holdem.raw_env method)": [[50, "pettingzoo.classic.rlcard_envs.texas_holdem.raw_env.render", false]], "render() (pettingzoo.classic.rlcard_envs.texas_holdem_no_limit.raw_env method)": [[51, "pettingzoo.classic.rlcard_envs.texas_holdem_no_limit.raw_env.render", false]], "render() (pettingzoo.classic.rps.rps.raw_env method)": [[49, "pettingzoo.classic.rps.rps.raw_env.render", false]], "render() (pettingzoo.classic.tictactoe.tictactoe.raw_env method)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env.render", false]], "render() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.render", false]], "render() (pettingzoo.sisl.pursuit.pursuit.raw_env method)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env.render", false]], "render() (pettingzoo.sisl.waterworld.waterworld.raw_env method)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env.render", false]], "render() (pettingzoo.utils.env.aecenv method)": [[2, "pettingzoo.utils.env.AECEnv.render", false]], "render() (pettingzoo.utils.env.parallelenv method)": [[3, "pettingzoo.utils.env.ParallelEnv.render", false]], "reset() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.reset", false]], "reset() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.reset", false]], "reset() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.reset", false]], "reset() (pettingzoo.classic.chess.chess.raw_env method)": [[43, "pettingzoo.classic.chess.chess.raw_env.reset", false]], "reset() (pettingzoo.classic.connect_four.connect_four.raw_env method)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env.reset", false]], "reset() (pettingzoo.classic.go.go.raw_env method)": [[46, "pettingzoo.classic.go.go.raw_env.reset", false]], "reset() (pettingzoo.classic.hanabi.hanabi.raw_env method)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env.reset", false]], "reset() (pettingzoo.classic.rps.rps.raw_env method)": [[49, "pettingzoo.classic.rps.rps.raw_env.reset", false]], "reset() (pettingzoo.classic.tictactoe.tictactoe.raw_env method)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env.reset", false]], "reset() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.reset", false]], "reset() (pettingzoo.sisl.pursuit.pursuit.raw_env method)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env.reset", false]], "reset() (pettingzoo.sisl.waterworld.waterworld.raw_env method)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env.reset", false]], "reset() (pettingzoo.utils.agent_selector.agentselector method)": [[4, "pettingzoo.utils.agent_selector.AgentSelector.reset", false]], "reset() (pettingzoo.utils.env.aecenv method)": [[2, "pettingzoo.utils.env.AECEnv.reset", false]], "reset() (pettingzoo.utils.env.parallelenv method)": [[3, "pettingzoo.utils.env.ParallelEnv.reset", false]], "reshape_v0()": [[8, "reshape_v0", false]], "resize_v1()": [[8, "resize_v1", false]], "rewards (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.rewards", false]], "save_observation() (in module pettingzoo.utils.save_observation)": [[4, "pettingzoo.utils.save_observation.save_observation", false]], "scale_actions_v0()": [[8, "scale_actions_v0", false]], "state() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.state", false]], "state() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.state", false]], "state() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.state", false]], "state() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.state", false]], "state() (pettingzoo.utils.env.parallelenv method)": [[3, "pettingzoo.utils.env.ParallelEnv.state", false]], "step() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.step", false]], "step() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.step", false]], "step() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.step", false]], "step() (pettingzoo.classic.chess.chess.raw_env method)": [[43, "pettingzoo.classic.chess.chess.raw_env.step", false]], "step() (pettingzoo.classic.connect_four.connect_four.raw_env method)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env.step", false]], "step() (pettingzoo.classic.go.go.raw_env method)": [[46, "pettingzoo.classic.go.go.raw_env.step", false]], "step() (pettingzoo.classic.hanabi.hanabi.raw_env method)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env.step", false]], "step() (pettingzoo.classic.rlcard_envs.gin_rummy.raw_env method)": [[45, "pettingzoo.classic.rlcard_envs.gin_rummy.raw_env.step", false]], "step() (pettingzoo.classic.rlcard_envs.leduc_holdem.raw_env method)": [[48, "pettingzoo.classic.rlcard_envs.leduc_holdem.raw_env.step", false]], "step() (pettingzoo.classic.rlcard_envs.texas_holdem.raw_env method)": [[50, "pettingzoo.classic.rlcard_envs.texas_holdem.raw_env.step", false]], "step() (pettingzoo.classic.rlcard_envs.texas_holdem_no_limit.raw_env method)": [[51, "pettingzoo.classic.rlcard_envs.texas_holdem_no_limit.raw_env.step", false]], "step() (pettingzoo.classic.rps.rps.raw_env method)": [[49, "pettingzoo.classic.rps.rps.raw_env.step", false]], "step() (pettingzoo.classic.tictactoe.tictactoe.raw_env method)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env.step", false]], "step() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.step", false]], "step() (pettingzoo.sisl.pursuit.pursuit.raw_env method)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env.step", false]], "step() (pettingzoo.sisl.waterworld.waterworld.raw_env method)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env.step", false]], "step() (pettingzoo.utils.env.aecenv method)": [[2, "pettingzoo.utils.env.AECEnv.step", false]], "step() (pettingzoo.utils.env.parallelenv method)": [[3, "pettingzoo.utils.env.ParallelEnv.step", false]], "sticky_actions_v0()": [[8, "sticky_actions_v0", false]], "suppress_output() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.suppress_output", false]], "terminateillegalwrapper (class in pettingzoo.utils.wrappers)": [[6, "pettingzoo.utils.wrappers.TerminateIllegalWrapper", false]], "terminations (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.terminations", false]], "truncations (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.truncations", false]], "unsuppress_output() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.unsuppress_output", false]], "warn_action_out_of_bound() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.warn_action_out_of_bound", false]], "warn_on_illegal_move() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.warn_on_illegal_move", false]], "warn_step_after_terminated_truncated() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.warn_step_after_terminated_truncated", false]]}, "objects": {"": [[8, 0, 1, "", "agent_indicator_v0"], [8, 0, 1, "", "black_death_v2"], [8, 0, 1, "", "clip_actions_v0"], [8, 0, 1, "", "clip_reward_v0"], [8, 0, 1, "", "color_reduction_v0"], [8, 0, 1, "", "delay_observations_v0"], [8, 0, 1, "", "dtype_v0"], [8, 0, 1, "", "flatten_v0"], [8, 0, 1, "", "frame_skip_v0"], [8, 0, 1, "", "frame_stack_v1"], [8, 0, 1, "", "max_observation_v0"], [8, 0, 1, "", "nan_noop_v0"], [8, 0, 1, "", "nan_random_v0"], [8, 0, 1, "", "nan_zeros_v0"], [8, 0, 1, "", "normalize_obs_v0"], [8, 0, 1, "", "pad_action_space_v0"], [8, 0, 1, "", "pad_observations_v0"], [8, 0, 1, "", "reshape_v0"], [8, 0, 1, "", "resize_v1"], [8, 0, 1, "", "scale_actions_v0"], [8, 0, 1, "", "sticky_actions_v0"]], "pettingzoo.atari.basketball_pong.basketball_pong": [[14, 1, 1, "", "raw_env"]], "pettingzoo.atari.boxing.boxing": [[15, 1, 1, "", "raw_env"]], "pettingzoo.atari.combat_plane.combat_plane": [[16, 1, 1, "", "raw_env"]], "pettingzoo.atari.combat_tank.combat_tank": [[17, 1, 1, "", "raw_env"]], "pettingzoo.atari.double_dunk.double_dunk": [[18, 1, 1, "", "raw_env"]], "pettingzoo.atari.entombed_competitive.entombed_competitive": [[19, 1, 1, "", "raw_env"]], "pettingzoo.atari.entombed_cooperative.entombed_cooperative": [[20, 1, 1, "", "raw_env"]], "pettingzoo.atari.flag_capture.flag_capture": [[21, 1, 1, "", "raw_env"]], "pettingzoo.atari.foozpong.foozpong": [[22, 1, 1, "", "raw_env"]], "pettingzoo.atari.ice_hockey.ice_hockey": [[23, 1, 1, "", "raw_env"]], "pettingzoo.atari.joust.joust": [[24, 1, 1, "", "raw_env"]], "pettingzoo.atari.mario_bros.mario_bros": [[25, 1, 1, "", "raw_env"]], "pettingzoo.atari.maze_craze.maze_craze": [[26, 1, 1, "", "raw_env"]], "pettingzoo.atari.othello.othello": [[27, 1, 1, "", "raw_env"]], "pettingzoo.atari.pong.pong": [[28, 1, 1, "", "raw_env"]], "pettingzoo.atari.quadrapong.quadrapong": [[29, 1, 1, "", "raw_env"]], "pettingzoo.atari.space_invaders.space_invaders": [[30, 1, 1, "", "raw_env"]], "pettingzoo.atari.space_war.space_war": [[31, 1, 1, "", "raw_env"]], "pettingzoo.atari.surround.surround": [[32, 1, 1, "", "raw_env"]], "pettingzoo.atari.tennis.tennis": [[33, 1, 1, "", "raw_env"]], "pettingzoo.atari.video_checkers.video_checkers": [[34, 1, 1, "", "raw_env"]], "pettingzoo.atari.volleyball_pong.volleyball_pong": [[35, 1, 1, "", "raw_env"]], "pettingzoo.atari.warlords.warlords": [[36, 1, 1, "", "raw_env"]], "pettingzoo.atari.wizard_of_wor.wizard_of_wor": [[37, 1, 1, "", "raw_env"]], "pettingzoo.butterfly.cooperative_pong.cooperative_pong": [[39, 1, 1, "", "env"], [39, 1, 1, "", "raw_env"]], "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env": [[39, 2, 1, "", "action_space"], [39, 2, 1, "", "close"], [39, 2, 1, "", "observation_space"], [39, 2, 1, "", "observe"], [39, 2, 1, "", "render"], [39, 2, 1, "", "reset"], [39, 2, 1, "", "state"], [39, 2, 1, "", "step"]], "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies": [[40, 1, 1, "", "env"], [40, 1, 1, "", "raw_env"]], "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env": [[40, 2, 1, "", "action_space"], [40, 2, 1, "", "close"], [40, 2, 1, "", "observation_space"], [40, 2, 1, "", "observe"], [40, 2, 1, "", "render"], [40, 2, 1, "", "reset"], [40, 2, 1, "", "state"], [40, 2, 1, "", "step"]], "pettingzoo.butterfly.pistonball.pistonball": [[41, 1, 1, "", "env"], [41, 1, 1, "", "raw_env"]], "pettingzoo.butterfly.pistonball.pistonball.raw_env": [[41, 2, 1, "", "action_space"], [41, 2, 1, "", "close"], [41, 2, 1, "", "observation_space"], [41, 2, 1, "", "observe"], [41, 2, 1, "", "render"], [41, 2, 1, "", "reset"], [41, 2, 1, "", "state"], [41, 2, 1, "", "step"]], "pettingzoo.classic.chess.chess": [[43, 1, 1, "", "env"], [43, 1, 1, "", "raw_env"]], "pettingzoo.classic.chess.chess.raw_env": [[43, 2, 1, "", "action_space"], [43, 2, 1, "", "close"], [43, 2, 1, "", "observation_space"], [43, 2, 1, "", "observe"], [43, 2, 1, "", "render"], [43, 2, 1, "", "reset"], [43, 2, 1, "", "step"]], "pettingzoo.classic.connect_four.connect_four": [[44, 1, 1, "", "env"], [44, 1, 1, "", "raw_env"]], "pettingzoo.classic.connect_four.connect_four.raw_env": [[44, 2, 1, "", "action_space"], [44, 2, 1, "", "close"], [44, 2, 1, "", "observation_space"], [44, 2, 1, "", "observe"], [44, 2, 1, "", "render"], [44, 2, 1, "", "reset"], [44, 2, 1, "", "step"]], "pettingzoo.classic.go.go": [[46, 1, 1, "", "env"], [46, 1, 1, "", "raw_env"]], "pettingzoo.classic.go.go.raw_env": [[46, 2, 1, "", "action_space"], [46, 2, 1, "", "close"], [46, 2, 1, "", "observation_space"], [46, 2, 1, "", "observe"], [46, 2, 1, "", "render"], [46, 2, 1, "", "reset"], [46, 2, 1, "", "step"]], "pettingzoo.classic.hanabi.hanabi": [[47, 1, 1, "", "env"], [47, 1, 1, "", "raw_env"]], "pettingzoo.classic.hanabi.hanabi.raw_env": [[47, 2, 1, "", "action_space"], [47, 2, 1, "", "close"], [47, 2, 1, "", "observation_space"], [47, 2, 1, "", "observe"], [47, 2, 1, "", "render"], [47, 2, 1, "", "reset"], [47, 2, 1, "", "step"]], "pettingzoo.classic.rlcard_envs.gin_rummy": [[45, 1, 1, "", "env"], [45, 1, 1, "", "raw_env"]], "pettingzoo.classic.rlcard_envs.gin_rummy.raw_env": [[45, 2, 1, "", "observe"], [45, 2, 1, "", "render"], [45, 2, 1, "", "step"]], "pettingzoo.classic.rlcard_envs.leduc_holdem": [[48, 1, 1, "", "env"], [48, 1, 1, "", "raw_env"]], "pettingzoo.classic.rlcard_envs.leduc_holdem.raw_env": [[48, 2, 1, "", "render"], [48, 2, 1, "", "step"]], "pettingzoo.classic.rlcard_envs.texas_holdem": [[50, 1, 1, "", "env"], [50, 1, 1, "", "raw_env"]], "pettingzoo.classic.rlcard_envs.texas_holdem.raw_env": [[50, 2, 1, "", "render"], [50, 2, 1, "", "step"]], "pettingzoo.classic.rlcard_envs.texas_holdem_no_limit": [[51, 1, 1, "", "env"], [51, 1, 1, "", "raw_env"]], "pettingzoo.classic.rlcard_envs.texas_holdem_no_limit.raw_env": [[51, 2, 1, "", "render"], [51, 2, 1, "", "step"]], "pettingzoo.classic.rps.rps": [[49, 1, 1, "", "env"], [49, 1, 1, "", "raw_env"]], "pettingzoo.classic.rps.rps.raw_env": [[49, 2, 1, "", "action_space"], [49, 2, 1, "", "close"], [49, 2, 1, "", "observation_space"], [49, 2, 1, "", "observe"], [49, 2, 1, "", "render"], [49, 2, 1, "", "reset"], [49, 2, 1, "", "step"]], "pettingzoo.classic.tictactoe.tictactoe": [[52, 1, 1, "", "env"], [52, 1, 1, "", "raw_env"]], "pettingzoo.classic.tictactoe.tictactoe.raw_env": [[52, 2, 1, "", "action_space"], [52, 2, 1, "", "close"], [52, 2, 1, "", "observation_space"], [52, 2, 1, "", "observe"], [52, 2, 1, "", "render"], [52, 2, 1, "", "reset"], [52, 2, 1, "", "step"]], "pettingzoo.mpe.simple.simple": [[55, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_adversary.simple_adversary": [[56, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_crypto.simple_crypto": [[57, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_push.simple_push": [[58, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_reference.simple_reference": [[59, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_speaker_listener.simple_speaker_listener": [[60, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_spread.simple_spread": [[61, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_tag.simple_tag": [[62, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_world_comm.simple_world_comm": [[63, 1, 1, "", "raw_env"]], "pettingzoo.sisl.multiwalker.multiwalker": [[65, 1, 1, "", "env"], [65, 1, 1, "", "raw_env"]], "pettingzoo.sisl.multiwalker.multiwalker.raw_env": [[65, 2, 1, "", "action_space"], [65, 2, 1, "", "close"], [65, 2, 1, "", "observation_space"], [65, 2, 1, "", "observe"], [65, 2, 1, "", "render"], [65, 2, 1, "", "reset"], [65, 2, 1, "", "state"], [65, 2, 1, "", "step"]], "pettingzoo.sisl.pursuit.pursuit": [[66, 1, 1, "", "env"], [66, 1, 1, "", "raw_env"]], "pettingzoo.sisl.pursuit.pursuit.raw_env": [[66, 2, 1, "", "action_space"], [66, 2, 1, "", "close"], [66, 2, 1, "", "observation_space"], [66, 2, 1, "", "observe"], [66, 2, 1, "", "render"], [66, 2, 1, "", "reset"], [66, 2, 1, "", "step"]], "pettingzoo.sisl.waterworld.waterworld": [[67, 1, 1, "", "env"], [67, 1, 1, "", "raw_env"]], "pettingzoo.sisl.waterworld.waterworld.raw_env": [[67, 2, 1, "", "action_space"], [67, 2, 1, "", "close"], [67, 2, 1, "", "observation_space"], [67, 2, 1, "", "observe"], [67, 2, 1, "", "render"], [67, 2, 1, "", "reset"], [67, 2, 1, "", "step"]], "pettingzoo.utils": [[4, 3, 0, "-", "agent_selector"], [4, 3, 0, "-", "average_total_reward"], [4, 3, 0, "-", "capture_stdout"], [6, 3, 0, "-", "conversions"], [4, 3, 0, "-", "save_observation"]], "pettingzoo.utils.agent_selector": [[4, 1, 1, "", "AgentSelector"], [4, 1, 1, "", "agent_selector"]], "pettingzoo.utils.agent_selector.AgentSelector": [[4, 2, 1, "", "is_first"], [4, 2, 1, "", "is_last"], [4, 2, 1, "", "next"], [4, 2, 1, "", "reinit"], [4, 2, 1, "", "reset"]], "pettingzoo.utils.average_total_reward": [[4, 0, 1, "", "average_total_reward"]], "pettingzoo.utils.capture_stdout": [[4, 1, 1, "", "capture_stdout"]], "pettingzoo.utils.conversions": [[6, 0, 1, "", "aec_to_parallel"], [6, 0, 1, "", "parallel_to_aec"]], "pettingzoo.utils.env": [[2, 1, 1, "", "AECEnv"], [3, 1, 1, "", "ParallelEnv"]], "pettingzoo.utils.env.AECEnv": [[2, 4, 1, "", "action_spaces"], [2, 4, 1, "", "agent_selection"], [2, 4, 1, "", "agents"], [2, 2, 1, "", "close"], [2, 4, 1, "", "infos"], [2, 4, 1, "", "max_num_agents"], [2, 4, 1, "", "num_agents"], [2, 4, 1, "", "observation_spaces"], [2, 2, 1, "", "observe"], [2, 4, 1, "", "possible_agents"], [2, 2, 1, "", "render"], [2, 2, 1, "", "reset"], [2, 4, 1, "", "rewards"], [2, 2, 1, "", "step"], [2, 4, 1, "", "terminations"], [2, 4, 1, "", "truncations"]], "pettingzoo.utils.env.ParallelEnv": [[3, 2, 1, "", "action_space"], [3, 4, 1, "", "action_spaces"], [3, 4, 1, "", "agents"], [3, 2, 1, "", "close"], [3, 4, 1, "", "max_num_agents"], [3, 4, 1, "", "num_agents"], [3, 2, 1, "", "observation_space"], [3, 4, 1, "", "observation_spaces"], [3, 4, 1, "", "possible_agents"], [3, 2, 1, "", "render"], [3, 2, 1, "", "reset"], [3, 2, 1, "", "state"], [3, 2, 1, "", "step"]], "pettingzoo.utils.env_logger": [[4, 1, 1, "", "EnvLogger"]], "pettingzoo.utils.env_logger.EnvLogger": [[4, 2, 1, "", "error_agent_iter_before_reset"], [4, 2, 1, "", "error_nan_action"], [4, 2, 1, "", "error_observe_before_reset"], [4, 2, 1, "", "error_possible_agents_attribute_missing"], [4, 2, 1, "", "error_render_before_reset"], [4, 2, 1, "", "error_state_before_reset"], [4, 2, 1, "", "error_step_before_reset"], [4, 2, 1, "", "flush"], [4, 2, 1, "", "get_logger"], [4, 4, 1, "", "mqueue"], [4, 2, 1, "", "suppress_output"], [4, 2, 1, "", "unsuppress_output"], [4, 2, 1, "", "warn_action_out_of_bound"], [4, 2, 1, "", "warn_on_illegal_move"], [4, 2, 1, "", "warn_step_after_terminated_truncated"]], "pettingzoo.utils.save_observation": [[4, 0, 1, "", "save_observation"]], "pettingzoo.utils.wrappers": [[6, 1, 1, "", "AssertOutOfBoundsWrapper"], [6, 1, 1, "", "BaseWrapper"], [6, 1, 1, "", "CaptureStdoutWrapper"], [6, 1, 1, "", "ClipOutOfBoundsWrapper"], [6, 1, 1, "", "OrderEnforcingWrapper"], [6, 1, 1, "", "TerminateIllegalWrapper"]]}, "objnames": {"0": ["py", "function", "Python function"], "1": ["py", "class", "Python class"], "2": ["py", "method", "Python method"], "3": ["py", "module", "Python module"], "4": ["py", "attribute", "Python attribute"]}, "objtypes": {"0": "py:function", "1": "py:class", "2": "py:method", "3": "py:module", "4": "py:attribute"}, "terms": {"": [2, 3, 6, 7, 8, 9, 10, 11, 12, 13, 16, 17, 19, 20, 21, 22, 23, 25, 27, 29, 30, 34, 35, 39, 40, 41, 43, 44, 45, 46, 47, 48, 50, 51, 54, 63, 65, 67, 68, 70, 71, 72, 73, 74, 75, 76, 77, 79, 80, 86, 87, 88, 89, 90, 92, 93, 94], "0": [2, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "000001": 71, "0001": [71, 72], "001": [12, 72, 73, 76], "01": [12, 66, 67, 70, 71, 72, 73, 75, 76], "015": 67, "02": [70, 71], "03": [70, 90, 91], "04": [70, 90], "04376": 42, "04908": 54, "05": [63, 70, 71, 94, 97], "06": [70, 87, 89, 90], "07": 70, "08": 70, "08932": 8, "09": 70, "09341": 13, "0th": 47, "1": [2, 6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 68, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "10": [9, 11, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 31, 33, 34, 39, 40, 46, 47, 54, 56, 59, 62, 65, 67, 71, 72, 73, 87, 89, 92, 93, 94, 95, 97], "100": [4, 10, 15, 26, 30, 39, 41, 45, 47, 51, 65, 71, 72, 73, 79, 80, 86, 90, 92, 93], "1000": [11, 37, 45, 48, 50, 51, 52, 94, 97], "10000": [47, 72], "100000": [13, 71, 73, 87], "10000000": 87, "10000000000": 4, "1002": 70, "1003": 70, "1004": 70, "1010": 70, "1011": 70, "1012": 70, "1013": 70, "1014": 70, "1015": 70, "1016": 70, "1017": 70, "1018": 70, "1019": 70, "1020": 70, "1024": [13, 70], "1026": 70, "1029": 70, "1031": 70, "1033": 70, "1034": 70, "1036": 70, "1037": 70, "1038": 70, "1041": 70, "1045": 70, "1046": 70, "1047": 70, "1051": 70, "1054": 70, "1055": 70, "1057": 70, "1058": 70, "1071": 70, "1074": 70, "1077": 70, "1080": 70, "1082": 70, "1083": 70, "1084": 70, "1086": 70, "1087": 70, "1088": 70, "1089": 70, "109": 45, "1090": 70, "1092": 70, "1095": 70, "1096": 70, "1097": 70, "10_000": [90, 92, 93], "10k": 90, "10x": 90, "11": [9, 15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 39, 43, 45, 46, 47, 48, 50, 51, 60, 65, 75, 76], "110": 45, "1103": 70, "1105": 70, "1107": 70, "111": 43, "1110": 70, "11111": 47, "1112": 70, "1116": 70, "1120": 70, "1124": 70, "1128": 70, "1129": 70, "1130": 70, "1133": 70, "1134": 70, "1135": 70, "1137": 70, "1139": 70, "1140": 70, "1144": 70, "1148": 70, "1149": 70, "1152": 70, "1153": 70, "1154": 70, "1155": 70, "11_12": [87, 89], "12": [15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 39, 43, 45, 47, 50, 51, 65], "120": [18, 41, 71, 72], "1200": 15, "12000": 75, "124": 47, "125": [12, 41, 47, 76, 89], "128": [12, 71, 72, 73, 75, 76, 89, 94, 97], "1280": 40, "13": [15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 43, 45, 47, 50, 51, 65, 71, 72, 73, 75, 76, 87, 89], "14": [15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 39, 40, 45, 47, 48, 50, 51, 60, 62, 65, 66], "15": [15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 47, 49, 65, 71, 72, 73], "150": 71, "16": [15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 40, 47, 62, 66, 75], "160": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37], "1626": 94, "16x16": 40, "17": [15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 40, 47], "1703": 54, "174": 47, "175": 47, "179": 47, "18": [9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 43, 45, 47, 61, 72, 73, 79, 80], "180": 47, "184": 47, "185": 47, "189": 47, "19": [43, 45, 46, 47, 48, 58, 87, 89], "190": 47, "1910": 42, "192": 63, "195": 47, "196_608": 93, "199": 47, "1_000_000": 81, "1d": 8, "1e": [12, 65, 71, 75, 76, 90, 93, 94, 97], "1e10": 87, "1st": [43, 46, 47], "2": [7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 56, 57, 58, 59, 60, 62, 63, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "20": [40, 41, 43, 47, 48, 57, 63, 67, 71, 72, 73, 86, 89, 90], "200": [12, 30, 37, 47, 65, 71, 76, 87], "20000": [25, 94], "200000": 71, "2000000": 75, "2008": 8, "2009": 13, "2013": 13, "2017": [54, 64], "2018": [8, 13], "2019": 42, "2020": [8, 13, 70], "2021": 70, "2022": [2, 7, 70, 91], "2023": 70, "2024": 70, "207": 47, "208": 47, "20_000": 97, "20_480": 90, "20k": 90, "21": [48, 94, 95, 97], "210": [14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 32, 33, 34, 35, 36, 37, 47], "211": 47, "22": [48, 67, 71, 72, 73, 94, 95, 97], "23": [20, 43, 47, 65, 71, 72, 73, 94, 95, 97], "24": [47, 65, 71, 72, 73, 75, 76, 87, 89, 90, 92, 93], "242": [67, 93], "25": [9, 13, 45, 47, 50, 51, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 70, 73, 89, 91], "250": [7, 26, 31], "2500": 37, "253": 13, "255": [12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 71, 72, 73, 75, 76], "256": [16, 71, 75, 92, 93], "26": [45, 50, 51, 65, 70], "260": 47, "261": 47, "262": 47, "263": 47, "266": 47, "267": 47, "268": 47, "269": 47, "27": [45, 50, 51, 58, 65, 70], "273": 47, "274": 47, "278": 47, "279": [13, 47], "28": [56, 59, 63, 65, 70, 71, 72, 73], "280": [39, 47], "281": 47, "282": 47, "283": 47, "29": [65, 70], "2d": [8, 46, 67], "2e": 89, "2f": [72, 73], "2n": 46, "2nd": [46, 47], "2x3": 71, "3": [8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 45, 46, 47, 48, 49, 50, 51, 52, 56, 59, 60, 61, 62, 63, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 92, 93, 94, 95, 97], "30": [30, 65, 66, 67, 87, 89, 90], "300": 65, "3000": 24, "30000": 71, "307": 47, "308": 47, "31": [45, 65, 71, 72, 73], "3136": 89, "32": [12, 45, 72, 73, 75, 76, 89], "320": [94, 97], "32999": 70, "33": 48, "34": 63, "342": 47, "343": 47, "34696": 70, "35": 48, "36": 48, "362": 46, "377": 47, "378": 47, "38": [45, 50, 51], "39": [45, 50, 51], "3d": 8, "3rd": [47, 70], "3x3": 52, "4": [8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 57, 62, 63, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 94, 95, 97], "40": [45, 50, 51, 90], "400": 71, "4000": 96, "40k": 90, "40x40": 40, "412": 47, "413": 47, "42": [2, 3, 4, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 69], "44": 45, "445": 47, "447": 47, "45": [45, 71], "457": 41, "4672": 43, "47": 13, "480": 39, "482": 47, "483": 47, "49": 47, "4th": 47, "4x": 74, "4x2x2": 71, "4x2x3": 71, "4x2x3x2": 71, "5": [11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 58, 59, 60, 61, 62, 63, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 86, 89, 90, 92, 94, 95, 97], "50": [7, 43, 47, 59, 62, 63, 70, 71, 87, 89, 90, 94, 97], "500": [65, 66, 67, 71, 72, 73], "50000": [87, 89], "5000000": 89, "51": [45, 50, 51, 71], "512": [12, 40, 75, 76, 89], "512px": 92, "512x512": 40, "517": 47, "518": 47, "52": [45, 50, 51], "523": 13, "53": [50, 51], "54": [51, 61], "552": 47, "553": 47, "56": [43, 50], "560": [39, 41], "562": 13, "57": [45, 50, 87, 89], "58": [45, 50], "587": 47, "588": 47, "59": 45, "5cat": 70, "5e": 75, "5th": 43, "5x52": 45, "6": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 40, 41, 43, 44, 45, 46, 47, 48, 49, 52, 63, 65, 67, 71, 74, 75, 79, 80, 86, 94, 95, 97], "6000": [71, 72, 73], "600000": 71, "61": [13, 50], "612": 71, "62": [50, 62], "621": 70, "622": 47, "63": [9, 50], "64": [12, 71, 72, 75, 76, 89, 94, 97], "65": [71, 72, 73], "657": 47, "658": 47, "66": [50, 64], "663": 47, "67": 50, "68": 50, "6x7": 44, "6x7x2": 71, "7": [15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 31, 33, 37, 43, 44, 45, 46, 47, 48, 49, 52, 65, 66, 67, 71, 75, 79, 80, 87, 89, 94], "70": [7, 45], "700": 71, "71": [45, 50], "72": 50, "720": 40, "73": 43, "731": 70, "732": 70, "734": 70, "737": 70, "738": 70, "739": 70, "74": 47, "741": 70, "743": 70, "747": 70, "748": 70, "749": 70, "75": [41, 47, 65, 67, 89, 90], "750": 70, "76": 90, "763": 70, "767": 70, "776": 70, "777": 70, "779": 70, "780": 70, "781": 70, "782": 70, "787": 70, "788": 70, "789": 70, "790": 70, "796": 70, "798": 70, "7e": 90, "7x7": 79, "8": [9, 12, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 31, 33, 37, 43, 44, 45, 46, 47, 48, 50, 51, 52, 56, 57, 58, 59, 65, 66, 67, 71, 72, 75, 76, 86, 89, 92, 93, 94, 95, 97], "80": 90, "800": [25, 41, 43, 46, 49, 70], "8000": 75, "802": 70, "804": 70, "807": 70, "808": 70, "809": 70, "810": 70, "814": 70, "817": 70, "818": 70, "8192": 90, "81_920": 92, "821": 70, "822": 70, "823": 70, "825": 70, "829": 70, "83": [45, 64], "831": 70, "832": 70, "833": 70, "835": 70, "836": 70, "837": 70, "838": 70, "839": 70, "84": [13, 45, 72, 75, 89, 92], "840": 70, "841": 70, "842": 70, "843": 70, "844": 70, "845": 70, "846": 70, "847": 70, "848": 70, "84px": 92, "850": 70, "852": 70, "853": 70, "854": 70, "855": 70, "856": 70, "857": 70, "858": 70, "859": 70, "86": 90, "865": 70, "867": 70, "869": 70, "870": 70, "872": 70, "874": 70, "875": 70, "876": 70, "879": 70, "880": [41, 70], "882": 70, "883": 70, "886": 70, "890": 70, "891": 70, "894": 70, "897": 70, "8th": 43, "8x8": 43, "8x8x73": 43, "9": [9, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 37, 39, 43, 44, 46, 47, 49, 62, 63, 65, 71, 72, 73, 75, 76, 87, 89, 92, 93, 94, 97], "900": [9, 39, 40, 72], "903": 70, "904": 70, "906": 70, "907": 70, "908": 70, "942": 70, "948": 70, "95": [72, 73, 75], "950": 70, "953": 70, "954": 70, "96": 45, "960": [39, 70], "964": 70, "968": 70, "97": 45, "970": 70, "972": 70, "975": 70, "979": 70, "980": 70, "984": 70, "985": 70, "986": 70, "987": 70, "99": [12, 71, 75, 76, 89], "990": 70, "991": 70, "992": 70, "993": 70, "994": 70, "995": [72, 73], "997": 70, "998": 70, "999": 70, "9998": 71, "A": [2, 3, 5, 6, 9, 10, 14, 21, 25, 26, 32, 33, 34, 40, 41, 42, 43, 44, 45, 47, 50, 51, 66, 68, 71, 77, 78, 92], "And": [3, 10, 79, 80], "As": [11, 38, 40, 47, 48, 64, 70, 71], "At": [4, 8, 10, 44, 45, 47, 48, 51, 61, 71, 78], "But": [14, 32, 54], "By": [2, 4, 47, 62, 63, 65, 66, 71], "For": [1, 2, 3, 7, 8, 10, 11, 13, 40, 41, 43, 45, 46, 47, 52, 57, 65, 67, 70, 71, 72, 73, 74, 79, 80, 83, 86, 90, 91, 92, 93], "If": [2, 3, 4, 6, 7, 8, 9, 10, 11, 13, 14, 17, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 44, 45, 47, 49, 52, 54, 64, 65, 67, 68, 71, 72, 73, 75, 76, 79, 80, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "In": [2, 3, 6, 9, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 40, 41, 42, 43, 51, 54, 55, 56, 57, 63, 65, 68, 70, 71, 80, 90], "It": [3, 4, 9, 10, 39, 43, 65, 68, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97], "Its": 26, "NOT": 75, "No": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 67, 70, 95], "Not": [9, 73], "Of": 13, "On": 23, "One": [43, 47, 56, 85], "THE": [12, 76], "TO": 75, "That": 47, "The": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 15, 16, 17, 18, 20, 25, 26, 27, 30, 31, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 56, 58, 59, 61, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 75, 76, 77, 78, 79, 80, 86, 87, 89, 90, 92, 93, 94, 95, 97], "Their": 9, "Then": [75, 91], "There": [9, 13, 25, 26, 39, 40, 45, 47, 70, 85], "These": [2, 3, 9, 10, 42, 43, 47, 54, 67, 68, 70, 74, 79, 80, 83, 85, 88, 90, 91, 96], "To": [1, 2, 6, 7, 8, 9, 10, 11, 13, 22, 27, 32, 34, 38, 39, 42, 54, 64, 70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "Will": [94, 95, 97], "_": [8, 12, 71, 72, 73, 75, 76, 87, 90, 92, 93, 94, 97], "__": 75, "_____": 86, "_________": 52, "__doc__": 86, "__file__": 75, "__future__": [92, 93], "__init__": [8, 10, 12, 71, 75, 76, 78, 79, 80, 86, 87, 89], "__main__": [12, 71, 72, 73, 75, 76, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "__name__": [12, 71, 72, 73, 75, 76, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "_accumulate_reward": 10, "_act": 86, "_action_emb": 87, "_action_spac": 10, "_agent_selector": 10, "_build": 1, "_clear_reward": 10, "_cumulative_reward": [10, 90], "_elit": 71, "_get_ag": 97, "_get_env": 97, "_label_with_episode_numb": [71, 72, 73], "_layer_init": [12, 76], "_observation_spac": 10, "_opp": 71, "_script": 1, "_value_out": 89, "_was_dead_step": 10, "ab": [12, 75, 76], "abbeel": 54, "abil": [30, 71], "abl": [9, 11, 16, 21, 26, 35], "about": [1, 3, 6, 41, 47, 54, 65, 67, 70, 71, 74, 78, 79, 85, 90], "abov": [9, 24, 26, 35, 41, 78, 87], "absolut": [40, 54, 81], "ac": 45, "acceler": [31, 67, 70], "accept": [2, 8, 9, 10, 16, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 65, 66, 67, 70, 90], "access": [2, 6, 9, 12, 54, 70, 76, 90, 91, 97], "accord": [2, 71, 72, 73, 86], "accordingli": 41, "account": [10, 31, 70, 71], "accumul": [8, 10, 43], "accur": 74, "achiev": [38, 41, 54, 65, 71], "acpc": 51, "across": [4, 30, 41, 70, 77], "act": [2, 8, 9, 10, 41, 49, 67, 71, 72, 73, 78, 86, 90, 92, 93], "act_messag": 86, "act_spac": [87, 89], "action": [3, 4, 6, 7, 8, 9, 10, 12, 13, 38, 39, 40, 41, 42, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 69, 70, 71, 72, 73, 75, 76, 78, 79, 83, 85, 87, 89, 91, 94], "action_": 71, "action_6": 49, "action_7": 49, "action_dim": [71, 72, 73], "action_embed_model": 87, "action_logit": 87, "action_mask": [2, 7, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 70, 71, 80, 86, 87, 90], "action_mask_fn": 90, "action_masking_ag": 86, "action_pars": 86, "action_shap": [94, 97], "action_spac": [2, 3, 4, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 75, 76, 78, 79, 80, 86, 87, 90, 92, 94, 97], "actiondict": 70, "actionmask": 90, "actionmaskag": 86, "actiontyp": [2, 3, 6], "activ": [25, 41, 70, 71, 72, 73, 92], "actor": [9, 12, 54, 68, 71, 72, 73, 75, 76], "actual": [11, 70, 86], "ad": [2, 3, 8, 9, 11, 39, 41, 49, 65, 66, 67, 70, 71, 81], "adam": [12, 71, 75, 76, 94, 97], "adapt": [70, 75, 91], "add": [8, 9, 10, 12, 39, 40, 49, 57, 66, 67, 70, 76, 92, 94], "add_argu": [75, 87, 89, 94], "add_scalar": 75, "add_text": [75, 94], "addit": [3, 4, 8, 11, 19, 20, 35, 37, 41, 45, 48, 49, 51, 65, 70], "addition": [8, 26, 41, 64], "address": 70, "adopt": [43, 44, 45, 46, 47, 48, 49, 50, 51, 52], "adv": 75, "advanc": [31, 47, 77], "advantaeg": [12, 76], "advantag": [12, 75, 76], "adversari": [15, 16, 17, 18, 54, 57, 58, 62, 63], "adversary_0": [56, 58, 62, 63], "adversary_1": [62, 63], "adversary_2": 62, "adversary_3": 63, "aec": [3, 4, 5, 8, 9, 10, 69, 70, 83, 87, 88, 90, 91, 92, 93], "aec_env": 6, "aec_rp": 10, "aec_to_parallel": [6, 70], "aec_to_parallel_wrapp": 6, "aec_wrapper_fn": 70, "aecenv": [4, 6, 10], "affect": [35, 47, 54], "after": [2, 4, 9, 10, 11, 16, 17, 18, 20, 25, 27, 34, 39, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 65, 66, 67, 70, 79, 80, 86, 87, 89, 90, 92, 93], "again": [10, 34, 71], "against": [37, 68, 71, 90, 92], "agent": [2, 3, 6, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 74, 75, 76, 77, 78, 79, 80, 88, 90, 91, 92, 93, 94, 95, 96], "agent1": 10, "agent2": 10, "agent_0": [55, 56, 58, 59, 61, 62, 63], "agent_1": [10, 56, 59, 61, 63], "agent_2": [10, 61], "agent_3": 10, "agent_id": [72, 73, 87, 94], "agent_indicator_v0": [8, 75], "agent_it": [2, 4, 6, 7, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 86, 87, 89, 90, 92, 93], "agent_learn": [94, 97], "agent_mask": [72, 73], "agent_nam": [47, 86], "agent_name_map": 10, "agent_oppon": [94, 97], "agent_ord": 4, "agent_reward": [72, 73], "agent_select": [2, 4, 6, 9, 10, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 79, 80, 90], "agent_selector": 4, "agent_three_count": 71, "agent_warm_up": 71, "agentid": [2, 3, 4, 6, 70], "agentselector": [4, 10], "agilerl": 70, "agilerl_dqn_curriculum": 71, "ai": 43, "aim": [46, 71], "al": [8, 13], "alg_nam": 87, "algo": [12, 71, 72, 73, 75, 76], "algorithm": [2, 8, 12, 68, 71, 72, 73, 74, 75, 76, 77, 87, 88, 89, 91, 96], "alic": 57, "alice_0": 57, "alices_comm": 57, "alien": 30, "all": [2, 3, 4, 6, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 56, 59, 61, 63, 64, 65, 66, 67, 70, 71, 78, 79, 85, 86, 90, 91], "all_ag": 4, "all_environ": 70, "all_landmark_rel_posit": [58, 59, 60], "all_modul": 70, "alli": 66, "alloc": [6, 10, 65, 67], "allow": [1, 2, 3, 4, 5, 7, 8, 9, 10, 11, 13, 22, 25, 47, 49, 52, 54, 70, 71, 72, 73, 74, 77, 79, 80, 90, 91, 92], "alogorithm": [72, 73], "along": [4, 8, 39, 43, 78], "alpha": 71, "alphachesszero": 43, "alphazero": [43, 46], "alreadi": [9, 10, 26, 66, 80], "also": [2, 4, 8, 9, 10, 14, 15, 18, 22, 27, 28, 29, 30, 33, 34, 35, 40, 47, 54, 62, 65, 66, 67, 68, 70, 71, 86, 90], "alter": 71, "altern": [3, 22, 71], "alternating_control": 30, "although": 71, "alwai": [39, 40, 41, 43, 54, 59, 61, 70, 71, 90], "among": [65, 66, 67, 86], "amount": [9, 41, 51], "an": [2, 3, 4, 5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 63, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 79, 80, 85, 86, 88, 90, 91, 92, 93, 96], "analog": [8, 11], "analyt": 70, "ananth": 8, "andrea": 70, "andrewrwilliam": 70, "andrewtanj": 70, "angl": [39, 40, 65], "angle_nois": 65, "angri": 41, "angular": [41, 65], "ani": [2, 4, 6, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 63, 65, 66, 67, 70, 71, 72, 73, 75, 76, 78, 79, 80, 81, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "anneal": [75, 87], "anneal_lr": 75, "annoi": 70, "annot": [92, 93], "announc": 70, "anoth": [8, 9, 47, 48, 51, 54, 81, 90], "ansi": [2, 3, 6, 9, 10, 11, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 65, 66, 67], "answer": 85, "anyon": 83, "anyth": 8, "anywai": 30, "anywher": 66, "apart": 54, "api": [4, 5, 6, 10, 12, 68, 69, 70, 74, 76, 79, 80, 90, 93, 96], "api_test": [2, 11], "apologi": 70, "appear": [20, 41], "append": [8, 9, 47, 71, 72, 73, 86, 89, 90], "append_imag": 89, "appli": [2, 5, 6, 8, 10, 41, 59, 61, 65, 66, 67, 71, 92], "applic": [49, 73, 85, 86, 88], "approach": [13, 43], "appropri": [3, 15, 39, 65], "approx": [12, 75, 76], "approx_kl": [12, 75, 76], "ar": [2, 3, 4, 6, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 70, 71, 72, 73, 75, 76, 78, 79, 80, 83, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "arang": [12, 71, 75, 76], "arbitrari": [2, 43, 44, 45, 46, 47, 48, 50, 51, 52, 70], "arc": 40, "arcad": [8, 13, 34, 68], "arch": [71, 72, 73], "archea": 67, "archer": [2, 4, 38, 70, 91], "archer_0": [40, 92], "archer_1": 40, "architectur": [71, 72, 73], "area": [8, 22, 29, 33, 35, 54, 62, 71, 85], "arg": [4, 65, 66, 67, 70, 75, 87, 89, 94], "argmin": 71, "argpars": [75, 87, 89, 94], "argument": [8, 9, 10, 11, 12, 13, 16, 38, 42, 54, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 94], "argumentpars": [75, 87, 89, 94], "arial": 71, "around": [3, 6, 10, 15, 16, 17, 19, 20, 23, 24, 31, 40, 54, 65, 66, 70, 71, 93], "arrai": [2, 3, 8, 9, 10, 12, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 65, 66, 67, 71, 76, 86], "arrow": [39, 40, 66], "art": [70, 91], "articl": [8, 13, 42, 54], "artifact": 70, "artifici": 13, "arxiv": [8, 13, 42, 54], "as_vector": 47, "ascii": 70, "ask": [71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "aspect": [9, 30, 32, 37], "assert": [6, 11, 70, 75, 90], "assertoutofbound": 70, "assertoutofboundswrapp": [6, 10], "assess": 7, "assign": [8, 71, 72, 73, 90], "assist": 85, "assort": 4, "assum": [81, 90], "assumpt": [6, 90], "astyp": 71, "atari": [8, 9, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 70, 71, 72, 73, 74, 75, 76, 77], "attack": [37, 40], "attempt": [65, 67, 86], "attr": 70, "attribut": [4, 6, 9, 10, 70, 79, 80], "attributeerror": 6, "author": [7, 8, 12, 13, 42, 54, 64, 71, 72, 73, 75, 76, 87, 89, 90, 92, 93, 94, 95, 97], "auto": [27, 68], "auto_rom_install_path": 13, "autobuild": 1, "autodepr": 70, "autom": 70, "automat": [1, 2, 9, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 54, 65, 66, 67, 70, 90], "autonom": [64, 68], "autorom": [13, 75], "avail": [8, 43, 44, 45, 46, 47, 48, 50, 51, 52, 71, 87], "averag": [20, 56, 59, 65, 67, 70, 93], "average_total_reward": 4, "avg": [72, 73, 92, 93], "avg_reward": [92, 93], "avg_reward_per_ag": 92, "aviv": 54, "avoid": [19, 20, 30, 32, 61, 67, 70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "awai": [10, 29, 35, 58], "awar": [24, 37], "award": [44, 45, 47], "awhil": 27, "axelbr": 70, "axi": [12, 71, 76], "b": [1, 8, 43, 71, 72, 75, 89, 92], "b_action": [12, 75, 76], "b_advantag": [12, 75, 76], "b_ind": 75, "b_index": [12, 76], "b_logprob": [12, 75, 76], "b_ob": [12, 75, 76], "b_return": [12, 75, 76], "b_valu": [12, 75, 76], "back": [6, 10, 17, 21, 25, 30, 43, 46, 70], "backend": 75, "backgammon": [7, 70], "backup_polici": 4, "backward": [12, 40, 75, 76], "bad": [27, 70], "badg": 70, "balanc": [41, 46, 49, 71], "ball": [14, 22, 28, 29, 33, 35, 36, 39, 41, 63, 70], "ball_elast": [41, 89], "ball_frict": [41, 89], "ball_mass": [41, 89], "ball_spe": [9, 39], "bamboofungu": 70, "bare": 11, "barrier": 67, "base": [2, 3, 4, 6, 9, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 41, 42, 44, 47, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 67, 68, 69, 70, 71, 72, 86], "base_class": [75, 92, 93], "base_env": 9, "baselin": [4, 8, 13], "baselines3": [70, 90, 92, 93], "basenam": 75, "baseparallelwrap": 70, "baseparallelwrapp": [6, 70], "basepolici": [94, 97], "basewrapp": [6, 90], "basic": [12, 26, 76, 79, 96], "basketbal": [13, 18], "basketball_pong": [14, 70], "basketball_pong_v3": [14, 28], "batch": [12, 71, 72, 73, 75, 76, 91, 94, 97], "batch_index": [12, 76], "batch_ob": 87, "batch_siz": [12, 71, 72, 73, 75, 76, 92, 93, 94, 97], "batched_act": 87, "batchifi": [12, 76], "batchify_ob": [12, 76], "battl": [21, 22, 29, 35, 37], "battlefield": 70, "beat": [49, 71], "becaus": [9, 10, 18, 20, 27, 47, 86, 90], "becom": [8, 9, 71], "been": [8, 9, 13, 26, 30, 43, 44, 47, 52, 66, 67, 70, 75, 90, 92, 93], "befor": [2, 4, 6, 8, 9, 10, 26, 27, 40, 42, 43, 70, 71, 78], "before_sleep": 86, "begin": [2, 18, 47, 48, 51, 57], "beginn": 70, "behav": 90, "behavior": [2, 6, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 41, 70], "behind": 32, "being": [8, 9, 16, 35, 40, 47, 49, 54, 62, 63, 66, 67, 70, 80], "bellemar": 13, "bellemare13arcad": 13, "belong": [29, 67], "below": [6, 10, 11, 13, 24, 25, 41, 43, 44, 45, 46, 47, 48, 50, 51, 52, 65, 71, 72, 73, 75, 76, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "benchmark": [64, 74, 77], "benefit": 37, "benjamin": [8, 13], "bertranddecost": 70, "best": [48, 71, 81], "best_act": 71, "best_fit": 71, "bet": [48, 51], "beta": [71, 85], "better": [8, 70, 71, 90], "between": [2, 3, 5, 6, 8, 10, 22, 23, 27, 30, 37, 40, 41, 54, 70, 71, 85, 86, 90, 96], "betwenen": 95, "beyond": [54, 65, 67, 85], "bi": 16, "bia": [12, 73, 75, 76], "bias": [71, 75, 77], "bias_const": [12, 75, 76], "biggest": 8, "billiard": 17, "billiard_hit": 17, "bin": 13, "binari": [42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 70], "biped": 65, "bird": 41, "bishop": 43, "bit": [13, 47, 57], "bitter": 71, "bkrl": 70, "black": [8, 13, 40, 43, 46, 62, 67, 70, 92], "black_0": 46, "black_death": 92, "black_death_v2": 8, "black_death_v3": 92, "blank": [71, 92], "blast": 17, "blizzard": 68, "blob": 75, "block": [26, 54, 62, 71, 72, 73, 80], "block_vert_coef": 71, "blockad": 26, "blog": [12, 75, 76, 91], "blue": [47, 63, 66], "board": [7, 22, 27, 43, 46, 52, 68, 70, 71, 80, 90], "board_histori": 43, "board_siz": [46, 90], "board_valu": 71, "boast": 96, "bob": [54, 57], "bob_0": 57, "bodi": 40, "bolundai0216": 70, "bomb": [21, 30], "bomberman": 68, "bonu": [25, 30], "booktitl": 64, "bool": [2, 3, 4, 45, 47, 71, 75], "boolean": 50, "bootstrap": [12, 75, 76], "border": [40, 41, 54], "bot": 68, "both": [4, 5, 6, 8, 10, 20, 21, 23, 25, 27, 32, 37, 41, 43, 44, 45, 46, 47, 49, 51, 52, 54, 57, 59, 67, 70, 74, 79, 83, 91], "both_dir": 71, "bottom": [40, 44, 54, 79, 81], "bounc": [17, 41], "bounce_random": [9, 39], "bound": [6, 8, 39, 62, 63], "bowl": 13, "box": [2, 8, 13, 55, 56, 57, 58, 59, 60, 61, 62, 63, 66, 87], "boxing_v2": 15, "bracket": 70, "break": [2, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 40, 70, 71, 72, 73, 75, 76, 90, 92, 93], "breakdown": 40, "bro": 13, "broadcast": 54, "broken": 70, "brought": 70, "buffer": [71, 72, 73, 94], "buffer_s": 94, "buffer_warm_up": 71, "bug": [2, 11, 39, 40, 43, 44, 45, 46, 47, 48, 50, 51, 52, 64, 65, 66, 67, 70], "bugfix": 70, "buggi": 70, "build": 96, "built": 81, "bullet": [16, 17, 31, 37, 68], "bump": [40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 70, 80], "bunch": 70, "butterfli": [3, 4, 6, 9, 10, 11, 12, 39, 40, 41, 69, 70, 75, 76, 87, 89, 92], "button": 34, "c": [13, 43, 70, 71, 72, 73], "cach": [10, 11, 70, 79, 80], "cake": 39, "cake_paddl": [9, 39], "calcul": [4, 12, 47, 70, 71, 75, 76], "call": [2, 4, 6, 8, 9, 10, 11, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70, 79, 80, 85, 90], "callabl": 97, "callback": [94, 97], "can": [1, 2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 57, 60, 61, 63, 64, 65, 66, 67, 68, 69, 70, 75, 79, 80, 81, 85, 86, 90, 91, 92, 93, 94, 97], "cannot": [2, 3, 4, 9, 14, 27, 40, 44, 47, 54, 57, 60, 68, 70], "cao": 42, "cap": 65, "capabililti": 70, "capabl": [43, 69], "captur": [6, 13, 26, 27, 34, 43, 46, 67, 75], "capture_stdout": 4, "capture_video": 75, "capturestdoutwrapp": [4, 6, 10], "card": [42, 45, 47, 48, 50, 51, 68], "card_knowledg": 47, "cardin": [54, 79], "care": [24, 26, 37], "carefulli": 10, "carla": 70, "carri": 65, "cartesian": [59, 63], "case": [2, 6, 9, 65, 70, 78], "cast": [70, 90], "castl": 43, "catch": [66, 70, 79], "catch_reward": 66, "categor": [12, 75, 76], "cathedr": 70, "caught": [2, 66], "caus": [2, 65, 70, 90], "cd": 1, "cell": [44, 52, 80], "center": [39, 40, 66], "central": [3, 39, 65, 72], "certain": [8, 9, 54, 70, 71, 80], "cff": 70, "challeng": [38, 39, 68], "champion": 71, "chanc": [2, 8], "chang": [1, 2, 3, 4, 6, 9, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 46, 47, 65, 66, 67, 70, 71, 75, 79, 80, 87, 90], "changeabl": 9, "changelog": 70, "channel": [8, 12, 43, 54, 57, 66, 70, 71, 72, 73, 76, 92], "channel_s": [71, 72], "channels_last": [72, 73], "chart": 75, "chase": 63, "chat_model": 86, "chatopenai": 86, "check": [4, 6, 11, 21, 43, 48, 50, 51, 57, 70, 71, 72, 73, 74, 75, 79, 80], "check_for_winn": 70, "check_three_in_row": 71, "check_vertical_win": 71, "check_winn": 71, "checker": [13, 70], "checkpoint": [71, 87, 89], "checkpoint_000050": [87, 89], "checkpoint_freq": [87, 89], "checkpoint_path": [87, 89], "chess": [1, 2, 7, 42, 68, 70, 71, 80, 88, 90], "chess_v5": 70, "chess_v6": [2, 43, 70, 90], "chicken": 68, "chines": 46, "chip": [48, 50, 51], "chipmunk": 41, "choic": [18, 49, 71, 94], "choos": [2, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 49, 54, 67, 71, 85], "chosen": [4, 8, 65, 86], "chrisyeh96": 70, "ci": [70, 87, 89, 90], "cibeah": 70, "circl": [54, 62], "circular": 54, "circumst": 9, "citat": 70, "cite": [7, 8, 42, 45, 48, 51, 54, 64], "cl": 86, "clamp": [12, 75, 76, 87], "class": [2, 3, 4, 6, 8, 10, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 71, 75, 76, 78, 79, 80, 86, 87, 89, 90], "classic": [1, 2, 3, 6, 17, 27, 28, 30, 34, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 68, 70, 71, 72, 73, 86, 87, 89, 94, 95, 97], "classmethod": 86, "clean": [12, 54, 70, 76, 91], "cleanrl": [12, 70, 94, 97], "cleanup": [40, 70], "clear": [30, 37, 70], "cli": [70, 75, 77, 96], "clip": [6, 8, 12, 75, 76], "clip_act": 89, "clip_actions_v0": 8, "clip_coef": [12, 75, 76], "clip_frac": [12, 76], "clip_grad_norm_": 75, "clip_param": 89, "clip_reward_v0": [8, 72, 75], "clip_vloss": 75, "clipfrac": 75, "clipoutofboundswrapp": [6, 10], "clock": [10, 43, 79, 80], "clockwis": 40, "clone": [71, 75], "close": [2, 3, 6, 7, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 70, 71, 72, 73, 75, 86, 89, 90, 92, 93], "closer": [2, 59], "closest": [56, 61], "club": [45, 50, 51], "cnn": [71, 72, 91, 92, 93], "cnnmodelv2": 89, "cnnpolici": 92, "co": [70, 74], "code": [1, 2, 6, 9, 10, 12, 40, 54, 64, 65, 70, 91, 96], "codebas": 54, "codeblock": 70, "coef": 75, "coeffici": [71, 75], "coin": 25, "col": 71, "collabor": 25, "collect": [8, 10, 12, 25, 66, 71, 72, 73, 76, 85, 86, 94, 95, 97], "collector": [94, 95, 97], "collid": [40, 61, 67], "collis": [39, 61, 62, 63, 65, 70], "color": [5, 8, 27, 43, 47, 54, 56, 59, 71, 92], "color_reduction_v0": [8, 12, 72, 75, 76, 89, 92], "column": [41, 43, 44, 45, 70, 71], "column_count": 71, "column_piec": 71, "com": [7, 12, 64, 70, 71, 72, 73, 75, 76, 87, 89, 90, 92, 93, 94, 95, 97], "combat": [13, 31], "combat_jet_v1": 16, "combat_plan": 16, "combat_plane_v2": 16, "combat_tank": 17, "combat_tank_v2": 17, "combat_tank_v3": 17, "combin": [6, 18, 41, 43, 45, 54, 70], "combined_arm": 70, "come": [8, 32], "comm": 54, "command": 1, "comment": [10, 70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "commit": 70, "common": [4, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 47, 49, 70, 75, 85, 90, 94, 97], "commonli": [5, 7, 9], "commun": [42, 47, 48, 50, 51, 54, 57, 59, 60, 61, 63], "companion": [8, 10], "compar": [64, 73, 74], "comparison": [3, 70], "compass": 43, "compat": [5, 13, 47, 68, 70, 90], "compens": 46, "compet": [7, 71], "competit": [7, 13, 14, 23, 26, 28, 30, 31, 32, 33, 37, 42, 54, 67, 71, 72, 74], "complet": [11, 47, 66, 70, 81, 94], "complex": [10, 16, 47, 68, 72, 85], "compli": 70, "complianc": 11, "complic": [71, 78], "compon": [71, 72, 73], "compos": [54, 65, 85], "composit": 54, "comprehens": 96, "compris": 13, "comput": [2, 9, 12, 13, 39, 40, 45, 46, 67, 71, 76, 87, 90], "computation": 8, "compute_actions_from_input_dict": 87, "compute_single_act": 89, "concat_vec_envs_v1": [75, 92, 93], "concaten": [8, 71], "concatvecenv": 70, "concept": [71, 78], "condit": [2, 9, 47, 70, 71, 79, 80], "confer": 64, "config": [70, 75, 87, 89], "configur": [9, 38, 47, 71, 72, 73], "confin": 68, "conflict": [68, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "confus": [26, 70], "connect": [2, 10, 39, 40, 41, 42, 43, 46, 47, 49, 52, 65, 66, 67, 70, 74, 88, 91], "connect_four": [44, 71, 90], "connect_four_": 71, "connect_four_v3": [42, 44, 71, 90], "consequ": 91, "conserv": 32, "consid": [2, 9, 41, 66, 71], "consider": 71, "consist": [11, 43, 54, 70, 79], "consol": [8, 13, 47], "const": 75, "constant": [8, 10, 11, 40, 79, 80, 92], "constant_": [12, 75, 76], "constantli": [19, 20], "constraint_window": 66, "construct": [47, 95], "constructor": [9, 87], "consum": 67, "cont_act": [72, 73], "contact": 65, "contain": [1, 9, 10, 43, 44, 45, 46, 47, 48, 50, 51, 52, 54, 65, 70, 71, 86], "content": [70, 71, 86], "continu": [6, 8, 12, 32, 41, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 67, 70, 71, 72, 73, 76, 78, 89], "continuous_act": [54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 73], "contrast": 2, "contrib": 90, "contribut": [1, 41, 68, 70], "contributor": 70, "control": [2, 8, 9, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 67, 70, 78, 91], "conv2d": [12, 75, 76, 89], "convei": 57, "conveni": [5, 6, 10, 43], "converg": 72, "convers": [5, 68, 70, 79, 80], "convert": [2, 3, 5, 6, 8, 10, 12, 70, 76, 90, 95], "convolut": [43, 72], "cook": 68, "cooper": [7, 8, 13, 30, 37, 38, 41, 47, 54, 64, 67, 70, 72, 93], "cooperative_pong": 39, "cooperative_pong_v5": [9, 39], "coordin": [20, 22, 29, 35, 38, 41, 43, 46, 63, 66, 67, 79, 80], "copi": [71, 79, 80, 94], "core": 70, "corner": [40, 46, 79], "correct": [11, 60, 70], "correctli": [2, 3], "correspond": [2, 8, 9, 10, 26, 40, 43, 44, 48, 52, 67], "costa": 75, "could": [2, 3, 9, 47, 51, 71], "count": [10, 17, 43, 45, 66, 71], "counter": [40, 71, 72, 73], "coupl": 13, "cours": 9, "court": 14, "cover": [56, 61], "cpu": [12, 71, 72, 73, 75, 76, 90, 92, 94, 97], "craft": 71, "crash": [11, 40], "craze": 13, "crazyfli": 68, "creat": [2, 3, 4, 6, 9, 10, 11, 26, 38, 47, 64, 67, 69, 70, 71, 72, 73, 75, 76, 78, 79, 83, 85, 87, 89, 90, 91, 92, 93, 94, 95, 97], "creation": [9, 70, 83], "criteria": 71, "critic": [12, 41, 54, 70, 72, 73, 75, 76], "crop": 8, "crt": 8, "crypto": 54, "cuda": [12, 71, 72, 73, 75, 76, 94, 97], "cudnn": 75, "cumul": [8, 9], "current": [2, 3, 4, 6, 8, 9, 10, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 68, 70, 79, 80, 86, 90], "current_ag": 90, "curriculum": [70, 74], "curriculumenv": 71, "cursor": [27, 34], "custom": [2, 3, 4, 69, 70, 78, 79, 80, 81, 90], "custom_environ": [78, 79, 80, 81], "custom_environment_v0": [78, 79, 80], "custom_model": 87, "custom_test": 11, "customactionmaskedenviron": [80, 81], "customenviron": [78, 79, 81], "cycl": [2, 3, 4, 6, 9, 10, 40, 54, 66, 70, 79, 80], "cyclic": 10, "d": [40, 41, 43, 68, 71, 90, 92, 93], "d0": 71, "d1": 71, "danger": [19, 20], "daochen": 42, "data": [4, 10, 12, 47, 65, 70, 75, 76, 94, 95, 97], "databas": 86, "date": 10, "datetim": 71, "ddpg": 72, "dead": [8, 10, 19, 20, 45, 70, 92], "deadwood": 45, "deadwood_count": 45, "deal": 13, "death": [8, 19, 20, 24, 25, 26, 36, 37, 40, 65, 70, 92], "debug": [10, 11, 55, 87, 89], "decai": [71, 72, 73], "deceiv": 56, "decent": 90, "decentr": [3, 39, 65, 72], "decept": 7, "decid": [46, 71], "decis": [71, 85], "deck": [45, 47, 48, 51], "declar": [1, 10, 45], "deep": [8, 64, 71, 72, 73, 74, 87, 94, 96, 97], "deepcopi": [71, 94], "deepmind": [2, 68, 71], "def": [10, 12, 62, 71, 72, 73, 75, 76, 78, 79, 80, 86, 87, 89, 90, 92, 93, 94, 97], "default": [2, 3, 4, 8, 9, 10, 13, 39, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 59, 60, 61, 62, 63, 65, 66, 67, 70, 71, 72, 73, 75, 90, 94], "default_output_kei": 86, "defeat": 49, "defend": [22, 29, 36], "defens": 23, "defin": [8, 10, 11, 45, 46, 47, 71, 72, 73, 79, 80, 86, 90, 95], "definit": [2, 70, 71], "degre": 38, "delai": [8, 73], "delay_observations_v0": 8, "delet": [70, 71], "deliber": 71, "delta": [12, 75, 76], "demo": [68, 70, 71, 72, 73, 90, 92, 93], "demonstr": [70, 71, 86, 91, 95], "dendrit": 67, "dep": 70, "depend": [2, 9, 13, 18, 30, 37, 38, 42, 46, 47, 54, 64, 65, 67, 70, 71, 72, 73, 75, 76, 78, 86, 87, 89, 90, 92, 93, 94, 95, 97], "dependabot": 70, "depict": [50, 66, 67], "deploy": 78, "deprec": [4, 70, 79, 80], "deprecated_modul": 10, "deprecatedenv": 10, "deprecatedmodul": 10, "depreci": [68, 78], "depric": 70, "dequ": [71, 86], "deriv": 68, "describ": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 43, 44, 45, 46, 47, 48, 50, 51, 52, 54, 63, 66, 78], "descript": [45, 46, 47, 48, 50, 51, 65, 67, 68, 87, 89], "design": [2, 10, 12, 20, 68, 71, 72, 73, 75, 76, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "desir": [4, 71], "despit": 13, "destin": 54, "destroi": 67, "detail": [3, 45, 48, 51, 54, 91], "detect": [2, 11, 67, 90], "determin": [11, 13, 49, 71, 72, 73, 90], "determinist": [8, 11, 13, 72, 73, 75, 90, 92, 93], "dev": 75, "develop": [2, 3, 13, 68, 70, 85], "devic": [12, 71, 72, 73, 75, 76, 94, 97], "di": [9, 19], "diagon": [27, 43, 44, 52, 71], "diagram": 70, "diamond": [45, 50, 51], "dict": [2, 3, 9, 10, 39, 40, 41, 43, 44, 46, 47, 49, 52, 65, 66, 67, 70, 71, 92, 94, 97], "dictat": 70, "dictionari": [3, 9, 10, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 70, 72, 73], "did": 90, "die": [8, 9, 40, 92], "differ": [2, 3, 6, 11, 24, 27, 42, 45, 47, 49, 54, 58, 59, 66, 71, 85, 86], "difficult": [2, 18, 30, 68, 71, 90], "difficulti": 71, "dilemma": 7, "dim": 71, "dimens": [71, 72, 73], "dimension": [43, 90, 92, 93], "direct": [16, 21, 39, 40, 41, 43, 54, 67, 70, 71, 79], "directli": [2, 9, 23, 33, 41, 47, 64, 91], "directori": [4, 10, 70, 81], "dirhtml": 1, "dirnam": 71, "disabl": [10, 11, 70, 79, 80, 90], "disadvantag": 46, "disallow": 6, "disappear": 26, "discard": [45, 47], "discord": [68, 70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "discount": [71, 72, 73, 75], "discount_factor": 97, "discourag": 64, "discov": 71, "discret": [2, 8, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 66, 70, 71, 72, 73, 75, 79, 80, 87, 90, 91, 93], "discrete_act": [71, 72, 73], "discuss": 71, "disk": [90, 92, 93], "displai": [2, 3, 10, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 54, 65, 66, 67], "distanc": [21, 40, 54, 55, 56, 58, 59, 61, 63, 67], "distribut": [2, 12, 65, 66, 67, 75, 76, 88], "distutil": 75, "diverg": 75, "divid": [20, 41, 90], "dm_control": 7, "dm_control_multiagent_compat": 7, "dm_soccer": 7, "dmcontrolmultiagentcompatibilityv0": 7, "dmytroivasiuk": 70, "do": [6, 8, 9, 11, 13, 40, 44, 54, 67, 68, 71, 75, 85, 86, 90, 91], "doc": [10, 70, 75, 78, 86], "docstr": 70, "doctest": 70, "document": [2, 3, 4, 7, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 45, 48, 51, 54, 56, 65, 70, 71, 72, 73, 74, 75, 77, 78, 79, 80, 83, 86, 87, 88, 89, 90, 92, 93, 96], "doe": [2, 4, 6, 8, 9, 11, 14, 18, 22, 27, 28, 29, 33, 34, 35, 47, 86, 90, 91, 92], "doesn": [56, 70, 90], "domain": [70, 73], "don": [8, 33, 62, 90], "done": [12, 25, 26, 36, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70, 71, 72, 73, 75, 76, 85, 95], "door": 79, "doubl": [13, 71], "double_dunk": 18, "double_dunk_v3": 18, "doudizhu": 70, "down": [8, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 66, 67, 71, 79, 80], "downleft": [15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 31, 33, 37], "downright": [15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 31, 33, 37], "downscal": 13, "downstream": 9, "dqn": [70, 74, 88, 94, 96, 97], "dqn_torch_model": 87, "dqnagent": 87, "dqnconfig": 87, "dqnpolici": [94, 97], "dqntorchmodel": 87, "draft": 90, "draw": [43, 44, 45, 49, 52, 71, 72, 73], "drawer": [71, 72, 73], "drawn": 47, "drive": 68, "drop": [44, 47, 70], "dsctt": 70, "dtype": [8, 10, 71, 80, 86], "dtype_v0": [8, 89], "due": [8, 11, 13, 41, 43, 44, 46, 47, 49, 52, 68, 70], "duel": 87, "duke": 15, "dummi": [32, 79, 80, 87, 89], "dummyvectorenv": [94, 95, 97], "dunk": 13, "duplic": [13, 70], "durat": [65, 71, 72, 73, 89], "dure": [4, 9, 11, 70, 94], "dylwil3": 70, "dynam": [2, 4, 67], "dynamic_resc": [55, 56, 57, 58, 59, 60, 61, 62, 63], "e": [1, 2, 3, 6, 8, 9, 30, 40, 41, 43, 54, 65, 70, 71, 79, 80, 81, 86], "each": [2, 3, 9, 10, 12, 13, 15, 18, 20, 22, 25, 26, 27, 29, 30, 35, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70, 71, 72, 73, 75, 76, 78, 79, 80, 90, 92, 93, 95], "earlier": [71, 90, 94], "earn": [24, 25], "easi": [4, 6, 10, 71, 92], "easier": [47, 70, 75], "easili": [19, 20, 71, 90], "easy_env": 90, "edg": [39, 40, 43, 65], "effect": [20, 21, 80], "effici": 6, "efg": [2, 70], "egorov": 64, "eight": 43, "either": [2, 4, 14, 21, 22, 25, 28, 35, 39, 40, 41, 44, 46, 47, 49, 52, 70], "elast": [39, 41], "elect": 71, "element": [8, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 65, 67, 70], "elif": [2, 38, 71, 79, 80], "elit": [71, 72, 73], "elite_opp": 71, "elliot": [7, 75, 90, 92, 93], "elliottow": [70, 75, 90, 92, 93], "els": [2, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 71, 72, 73, 74, 75, 76, 86, 87, 89, 90, 92, 93, 94, 97], "elsewher": 10, "em": [70, 86, 87], "embed": 87, "emerg": [38, 41, 54], "emit": 6, "empti": [9, 10, 44, 46, 70], "en": [43, 70, 90, 92, 93], "enabl": [8, 26, 40, 67, 70, 71, 72, 73, 75, 90], "encod": [8, 43, 46, 47, 48, 49, 52], "encounter_reward": 67, "encourag": [9, 11, 13, 70, 71], "encrypt": 57, "end": [2, 3, 6, 12, 13, 15, 19, 20, 30, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 67, 70, 71, 75, 76, 85, 90], "end_dim": [12, 76], "end_step": [12, 76], "enemi": 24, "enforc": [6, 70], "engin": [41, 68, 70, 71, 91, 96], "enh": 70, "enhanc": 72, "enough": [2, 11], "ensur": [1, 9, 45, 70, 71], "ent": 75, "ent_coef": [12, 75, 76], "entir": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 45, 70], "entireti": 78, "entiti": [40, 67, 75], "entomb": [13, 19, 20], "entombed_competit": 19, "entombed_competitive_v3": 19, "entombed_coop": [20, 70], "entombed_cooperative_v3": 20, "entri": [9, 10, 48, 50, 51], "entropi": [12, 75, 76], "entropy_coeff": 89, "entropy_loss": [12, 75, 76], "enumer": [12, 65, 67, 71, 75, 76], "env": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 75, 76, 78, 79, 80, 81, 86, 87, 88, 89, 90, 92, 93, 94, 95, 97], "env_creat": [87, 89], "env_defined_act": [72, 73], "env_don": 70, "env_fn": [11, 90, 92, 93], "env_func": 11, "env_id": 75, "env_kwarg": [90, 92, 93], "env_logg": 4, "env_max": [8, 89], "env_min": [8, 89], "env_nam": [87, 89], "env_reward": 71, "env_step": [94, 97], "env_trunc": 10, "environ": [2, 3, 4, 5, 6, 8, 12, 38, 39, 40, 41, 42, 43, 44, 45, 46, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 74, 77, 78, 80, 85, 91], "environment_paramet": 9, "environmentcr": 70, "ep": [12, 71, 72, 73, 75, 76, 94], "episod": [4, 12, 40, 57, 70, 71, 72, 73, 74, 75, 76, 95], "episode_num": [71, 72, 73], "episode_per_test": 97, "episodes_per_epoch": 71, "episodic_length": 75, "episodic_return": 75, "epoch": [71, 75, 94, 97], "eps_decai": [71, 72, 73], "eps_end": [71, 72, 73], "eps_test": 94, "eps_train": 94, "epsilon": [71, 72, 73, 87], "epsilon_timestep": 87, "epsilongreedi": 87, "equal": [42, 45, 47, 65, 71], "equival": [2, 3, 6, 8, 9], "erik": 13, "error": [2, 4, 6, 9, 10, 11, 47, 70, 71, 87, 89], "error_agent_iter_before_reset": 4, "error_nan_act": 4, "error_observe_before_reset": 4, "error_possible_agents_attribute_miss": 4, "error_render_before_reset": 4, "error_state_before_reset": 4, "error_step_before_reset": 4, "escap": [19, 20, 79, 80], "escape_i": [79, 80], "escape_x": [79, 80], "especi": [8, 70], "essenti": [24, 37], "establish": 4, "estim": 75, "estimation_step": 97, "et": [8, 13], "etc": [8, 10, 11, 70, 86], "euclidean": [55, 56, 67], "ev": [54, 57], "evad": 66, "evader_spe": 67, "eval": [12, 71, 76, 92, 93, 94], "eval_action_mask": 90, "eval_actions_dict": 71, "eval_actions_hist": 71, "eval_oppon": 71, "eval_turn": 71, "evalu": [4, 8, 11, 13, 70, 71, 72, 73], "eve_0": 57, "even": [2, 10, 13, 90], "evenli": 67, "eventu": 30, "everi": [1, 2, 3, 6, 9, 13, 41, 63, 66, 67, 70, 71, 93, 95], "everyon": 70, "everyth": [13, 40, 71], "evo": 71, "evo_epoch": [71, 72, 73], "evo_loop": [71, 72, 73], "evo_step": [71, 72, 73], "evohpo": 71, "evolut": [71, 72, 73], "evolutionari": [71, 72, 73, 74], "evolv": [2, 71, 72, 73], "exact": 54, "exactli": 49, "exampl": [1, 4, 6, 11, 13, 43, 45, 46, 47, 49, 67, 70, 71, 75, 79, 80, 83, 85, 86, 87, 90, 91, 92, 94, 95, 97], "exce": 67, "exceed": 70, "exceedingli": [12, 76], "except": [3, 6, 8, 9, 13, 43, 44, 45, 46, 47, 48, 50, 51, 52, 60, 63, 72, 73, 86, 90, 92, 93], "excit": [70, 71], "exclud": 45, "exclus": 2, "execut": [1, 2, 3, 8, 9, 12, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 54, 65, 66, 67, 75, 76, 79, 80, 91, 95], "exert": 65, "exist": [6, 8, 11, 40, 44, 47, 70], "exist_ok": [71, 72, 73, 97], "exit": [26, 33, 62, 87, 89, 90, 92, 93], "exp": [12, 62, 75, 76], "exp_nam": 75, "expand": 70, "expand_dim": [71, 72, 73, 87], "expandus": [87, 89], "expans": [49, 70], "expect": [24, 90, 94], "experi": [71, 72, 73, 75, 77], "experiment": 40, "explain": [12, 76], "explained_var": [12, 75, 76], "explained_vari": 75, "explicitli": [2, 47], "exploit": 71, "explor": [20, 71, 72, 73, 87], "exploration_config": 87, "exploration_nois": [94, 97], "express": 43, "extend": [2, 72, 73, 86, 94], "extens": [2, 13, 71], "extern": [4, 5, 7, 70, 85], "extra": [49, 70], "extract": 87, "extractor": [90, 92, 93], "ezpickl": 70, "f": [12, 40, 43, 71, 72, 73, 75, 76, 79, 80, 86, 90, 92, 93, 94, 97], "f1tenth": 68, "f841": 86, "face": 70, "facilit": 43, "fact": [8, 17], "factor": [9, 41, 65, 67, 71, 72, 73, 75], "fail": [11, 65, 70], "fairli": 27, "fall": [36, 44, 65], "fall_reward": 65, "fallen": 65, "fals": [4, 8, 9, 10, 11, 12, 13, 17, 30, 39, 40, 41, 45, 47, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 86, 87, 92, 94, 97], "famili": 9, "familiar": [7, 18], "fan": 18, "fantast": 9, "far": [20, 47, 58, 61, 86], "farama": [7, 10, 13, 38, 68, 70, 79, 80, 90], "fast": [71, 96], "fast_bomb": 30, "faster": [8, 13, 16, 30, 62, 70, 74], "fastrand": [71, 72, 73], "favicon": 70, "favor": [70, 94], "fcnet": 87, "feat": 71, "featur": [9, 11, 43, 47, 54, 67, 70, 77, 90, 92, 93], "feel": [71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "fernadoo": 70, "fetch": 85, "few": [8, 10, 13, 18, 42, 68, 91], "ffelten": 70, "field": [17, 71], "field_nam": [71, 72, 73], "fig1": [71, 74], "file": [1, 4, 12, 70, 76, 77, 81, 94], "filenam": [72, 73], "filipinogambino": 70, "fill": [8, 32, 44, 71, 72, 73], "fill_replay_buff": 71, "final": [40, 43, 47, 49, 71, 72, 73, 90, 94], "final_epsilon": 87, "find": [10, 19, 20, 43, 71], "fine": 90, "finish": [70, 71, 90, 92, 93], "finit": 8, "fire": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 40], "firebal": 25, "firework": 47, "first": [2, 4, 6, 8, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70, 71, 72, 73, 78, 85, 91], "first_0": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37], "fit": [6, 71, 72, 73], "fix": [16, 19, 20, 24, 25, 26, 27, 29, 34, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 50, 51, 52, 54, 64, 65, 66, 67, 70, 75], "flag": [13, 65, 86], "flag_captur": 21, "flag_capture_v2": 21, "flake8": [70, 75], "flash": [8, 70], "flatten": [8, 12, 43, 71, 75, 76, 89], "flatten_v0": 8, "flexibl": [2, 68], "fli": 30, "flicker": 13, "flight": 16, "flip": [25, 27, 71], "float": [2, 3, 4, 6, 12, 45, 46, 67, 71, 75, 76, 94], "float16": 8, "float32": [8, 86, 89], "float64": 8, "float_max": 87, "floor": [25, 35], "flush": 4, "fly": 16, "fmt": 75, "focus": [71, 74], "fold": [43, 48, 50, 51, 70], "folder": [1, 4, 70, 75], "follow": [1, 2, 3, 5, 6, 8, 9, 10, 13, 27, 43, 46, 47, 48, 49, 50, 51, 52, 54, 62, 68, 70, 71, 72, 73, 74, 75, 76, 78, 79, 80, 86, 87, 89, 90, 92, 93, 94, 95, 97], "font": 71, "food": [63, 67], "food_reward": 67, "foozbal": 22, "foozpong": [13, 70], "foozpong_v3": 22, "forc": [32, 65], "forest": 63, "forev": [30, 67, 70], "form": [2, 40, 47, 54, 66, 67, 70], "formal": 2, "format": [10, 70, 71, 86, 95], "forth": [10, 30], "fortress": 36, "forward": [40, 80, 87, 89], "forward_reward": 65, "found": [1, 11, 43, 44, 45, 46, 47, 48, 50, 51, 52, 71, 75, 90, 92, 93], "foundat": [7, 13, 68, 70], "four": [13, 22, 29, 35, 36, 40, 42, 54, 70, 74, 78, 79, 88, 91], "fourth_0": [22, 29, 35, 36], "fp": [8, 70], "frac": 75, "fraction": [12, 71, 76], "frame": [3, 5, 8, 9, 13, 18, 34, 43, 46, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 67, 70, 71, 72, 73, 74, 91, 92, 95], "frame_list": 89, "frame_no": 71, "frame_s": [12, 76], "frame_skip": [8, 13], "frame_skip_v0": [8, 13, 72, 75], "frame_stack_v1": [8, 12, 13, 72, 75, 76, 89, 92], "frames_per_second": 70, "frameskip": 8, "framework": [74, 85, 87, 89, 96], "free": [71, 72, 73, 75, 76, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "freeze_evad": 66, "freq": [71, 94], "frequenc": [71, 72, 73], "frequent": 2, "frequneci": 73, "friction": 41, "friendli": [70, 77], "from": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 75, 76, 77, 78, 79, 80, 81, 83, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "from_checkpoint": [87, 89], "from_parallel": [10, 70], "fromarrai": [71, 72, 73, 89], "front": [23, 40, 65, 80], "full": [8, 10, 13, 44, 47, 51, 66, 67, 70, 75, 79, 83, 92, 94, 96], "full_action_spac": 13, "full_column": 71, "fulli": [8, 66, 70], "fullyconnectednetwork": 87, "fun": 79, "function": [2, 4, 5, 6, 9, 10, 11, 39, 40, 41, 43, 44, 45, 46, 47, 49, 52, 62, 63, 65, 66, 67, 68, 70, 71, 72, 73, 75, 78, 86, 87, 90, 94, 97], "functool": [10, 79, 80], "further": [71, 72, 73], "futur": 47, "g": [2, 3, 8, 13, 43, 54, 70, 71, 79, 80, 81], "g1": 43, "gae": 75, "gae_lambda": 75, "gain": 25, "game": [2, 3, 4, 6, 7, 8, 9, 10, 11, 14, 15, 16, 17, 18, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 70, 71, 74, 75, 79, 80, 86, 90, 91, 92, 93, 95, 96], "game_nam": 7, "game_vers": [16, 26, 28], "gamma": [12, 71, 72, 73, 75, 76, 89, 94], "gather": 70, "gen_envs_md": 1, "gener": [1, 2, 3, 7, 8, 9, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 69, 70, 75, 80, 86], "generated_ag": [2, 70], "get": [4, 9, 10, 12, 14, 17, 19, 20, 21, 22, 23, 27, 28, 29, 33, 35, 37, 38, 41, 43, 45, 51, 55, 59, 70, 71, 72, 73, 76, 79, 80, 87, 89, 90, 92, 93, 94], "get_action_and_valu": [12, 75, 76], "get_ag": 94, "get_arg": 94, "get_doc": 86, "get_env": 94, "get_logg": 4, "get_pars": 94, "get_polici": 87, "get_valu": [12, 75, 76], "getact": [71, 72, 73], "getctim": [90, 92, 93], "getcwd": 4, "getmodul": 86, "getvalu": 4, "gg": 70, "gif": [70, 71, 72, 73, 89], "gif_path": [71, 72, 73], "gin": [42, 70], "gin_reward": 45, "gin_rummi": 45, "gin_rummy_v4": [45, 90], "git": [94, 95, 97], "github": [7, 12, 64, 70, 71, 72, 73, 74, 75, 76, 78, 87, 89, 90, 91, 92, 93, 94, 95, 97], "gitlab": 70, "give": [6, 10, 11, 14, 21, 22, 28, 29, 35, 41, 42, 47, 59, 63, 65, 70, 86, 91], "given": [2, 4, 6, 8, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 41, 42, 46, 47, 49, 86], "glitch": 39, "glob": [90, 92, 93], "global": [3, 9, 39, 40, 41, 59, 61, 65, 67], "global_reward": 41, "global_step": [71, 75], "go": [1, 42, 45, 70, 71, 80, 85, 90], "go_v5": [46, 90], "goal": [22, 25, 27, 32, 33, 41, 54, 86], "goal_id": [59, 60], "goal_landmark_id": 58, "goal_rel_posit": [56, 58], "gobblet": 70, "goe": [39, 45, 65], "good": [11, 17, 54, 56, 57, 58, 62, 63, 70], "googl": [68, 70], "gpu": [90, 93], "grad": 75, "grad_clip": 89, "grade": 88, "gradient": [2, 72, 73, 75], "gradio": 68, "grai": 60, "grand": 71, "graph": 2, "graphic": [8, 10, 11], "grayscal": 13, "grayscale_imag": 13, "greater": [49, 51], "greater_equ": 71, "greedi": 27, "greedili": 27, "green": [47, 54, 56, 62, 67], "greyscal": 8, "grid": [40, 44, 52, 66, 68, 79, 80], "gridworld": 3, "ground": [54, 65], "grow": 54, "gt": 70, "gtp": 46, "guarante": 68, "guard": [79, 80], "guard_act": [79, 80], "guard_action_mask": 80, "guard_i": [79, 80], "guard_x": [79, 80], "gui": 70, "guid": [10, 70, 71, 74, 78], "guided_missil": 16, "guo": 42, "gupta": 64, "gupta2017coop": 64, "gym": [2, 3, 13, 70, 75], "gymnasium": [2, 5, 7, 8, 9, 10, 68, 69, 70, 71, 72, 73, 75, 79, 80, 87, 90, 94, 97], "gymnasium_ag": 86, "gymnasiumag": 86, "h": [43, 71, 72, 73, 90, 92, 93], "ha": [4, 8, 9, 11, 12, 13, 18, 22, 25, 26, 30, 40, 43, 44, 46, 47, 52, 58, 59, 61, 66, 67, 70, 71, 74, 75, 76, 81, 90, 92, 93], "had": [10, 66], "half": [39, 49, 51], "halv": 20, "hanabi": [42, 70, 90], "hanabi_v4": 70, "hanabi_v5": [47, 70, 90], "hand": [9, 10, 45, 47, 48, 49, 50, 51, 70], "hand_siz": 47, "handl": [2, 4, 8, 9, 10, 13, 19, 20, 23, 24, 25, 26, 36, 37, 40, 65, 70, 78, 80, 92], "happen": [71, 90], "harb": 54, "hard": [2, 70, 71, 85], "hard_env": 90, "harder": 71, "hardwar": 13, "hari": 8, "has_maz": 17, "hasattr": 94, "hausknecht": 13, "have": [2, 3, 4, 6, 8, 9, 11, 12, 13, 15, 17, 18, 26, 27, 37, 42, 43, 44, 47, 49, 54, 56, 57, 65, 66, 67, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93, 94, 95, 97], "he": 93, "head": [40, 65], "hear": 54, "heart": [45, 50, 51], "hearthston": 68, "heavili": 90, "height": [12, 40, 41, 71, 76], "held": 34, "help": [9, 10, 20, 25, 43, 63, 69, 70, 71, 72, 73, 75, 76, 85, 86, 87, 89, 90, 92, 93, 94, 95, 97], "helper": [4, 78], "helpingstar": 70, "here": [10, 13, 71, 79, 80, 86, 92, 95], "herng": 42, "heterogen": 8, "heurist": 27, "hidden": [12, 21, 54, 71, 72, 73, 75, 76, 87, 94], "hidden_s": [71, 72, 73, 94, 97], "hide": 63, "high": [8, 9, 30, 38, 61, 72, 73, 77, 87, 96], "higher": [32, 35, 40, 41, 71], "highest": 71, "highli": [8, 9, 38, 41, 70, 77], "hint": [21, 47, 70, 96], "hip": 65, "histogram": 71, "hit": [4, 16, 17, 24, 25, 27, 30, 31, 36, 37, 40, 62], "hoard": 30, "hockei": 13, "hoffmann": 70, "hold": [10, 18, 43, 44, 45, 46, 47, 52, 70, 79, 80, 86, 87, 90], "holdem": [42, 70, 87, 88, 90], "homepag": 70, "homogen": 8, "hook": 70, "hoop": 14, "hope": 13, "hopefulli": 70, "horizont": [44, 52, 65, 67, 71], "horizontal_thrust": 67, "hot": [8, 47], "hotfix": 70, "hour": 70, "hover": 34, "how": [1, 2, 11, 19, 20, 24, 25, 26, 30, 36, 37, 39, 40, 41, 46, 54, 55, 56, 61, 65, 70, 71, 72, 73, 75, 76, 77, 80, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 97], "howev": [2, 9, 24, 29, 30, 47, 49, 71, 86], "hpo": [71, 72, 73, 74], "html": [12, 53, 75, 76, 90, 92, 93], "http": [7, 10, 12, 64, 70, 71, 72, 73, 75, 76, 79, 80, 87, 89, 90, 91, 92, 93, 94, 95, 97], "hu": 42, "huang": [2, 42], "huge": 11, "huggingfac": [68, 70], "hull": 65, "human": [2, 3, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 71, 76, 86, 90, 92, 93, 94, 95], "humanmessag": 86, "hunt": 68, "hyper": [71, 72, 73, 74], "hyperparam": [71, 72, 73], "hyperparamet": [71, 72, 73, 75, 77, 90], "i": [1, 2, 3, 4, 5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 74, 75, 76, 77, 78, 79, 80, 81, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97], "ic": 13, "ice_hockei": 23, "ice_hockey_v2": 23, "iclr": 91, "id": [8, 9, 10, 45, 46, 47, 48, 50, 51, 72, 73, 75, 94], "ideal": 13, "ident": [20, 26], "identifi": [8, 13, 43, 54, 86], "idx": 75, "idx_epi": [71, 72, 73], "idx_step": 71, "ignor": 8, "igor": 54, "illeg": [2, 4, 6, 9, 10, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 70, 71, 86, 90], "illegal_reward": [6, 7], "im": [71, 72, 73], "imag": [4, 8, 13, 41, 43, 70, 71, 72, 73, 89], "imagedraw": [71, 72, 73], "imagefont": 71, "imageio": [71, 72, 73], "imagin": 71, "img": [71, 89], "img_res": 71, "immedi": [20, 65, 71], "impact": 70, "implement": [2, 3, 6, 7, 8, 9, 11, 13, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 52, 65, 66, 67, 68, 70, 74, 77, 78, 83, 85, 86, 88, 91], "impli": 9, "import": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 72, 73, 75, 76, 78, 79, 80, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "import_modul": 75, "importlib": 75, "importorskip": 90, "imposs": 80, "imprecis": [41, 70], "improv": [65, 70, 71], "inaccuraci": 26, "incl": 90, "includ": [2, 5, 6, 9, 10, 39, 45, 47, 53, 54, 64, 65, 68, 69, 70, 74, 75, 77, 78, 83, 85], "inclus": 44, "inconveni": 70, "incorpor": 43, "incorrect": [9, 70], "increas": [8, 49, 70, 71, 74, 85], "increasingli": 71, "indefinit": [14, 18, 22, 27, 28, 29, 33, 34, 35], "independ": [71, 88], "index": [43, 44, 45, 46, 47, 48, 50, 51, 52, 65, 67, 70, 71], "indi_agent_reward": [72, 73], "indic": [8, 11, 12, 44, 47, 52, 66, 67, 76, 86], "individu": [7, 12, 65, 76], "industri": 88, "inf": [55, 56, 57, 58, 59, 60, 61, 62, 63, 65], "inf_mask": 87, "infer": [10, 47, 71, 72, 73, 79, 80], "infin": 62, "info": [2, 3, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93], "inform": [1, 2, 3, 7, 8, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70, 71, 72, 73, 74, 77, 86, 87, 88, 89, 90, 91, 92, 93], "inher": 46, "inherit": [6, 10], "inidivdu": [72, 73], "init": [10, 12, 71, 75, 76, 79, 80, 87, 89], "init_hp": [71, 72, 73], "initi": [6, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 71, 72, 73, 79, 80, 90], "initial_epsilon": 87, "initialpopul": [71, 72, 73], "inproceed": 64, "input": [5, 6, 10, 38, 54, 67, 71, 72, 73], "input_dict": [87, 89], "insert": [2, 3, 6, 7, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69], "insid": [8, 63], "inspect": [11, 86], "inspir": [12, 68, 76], "instal": [1, 7, 8, 10, 70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "instantan": [2, 9], "instanti": [71, 72, 73], "instantli": 90, "instead": [4, 6, 8, 10, 13, 17, 40, 43, 47, 70, 71], "institut": 71, "instruct": [70, 75, 86], "instrument": 13, "insuffici": [43, 70], "int": [2, 3, 4, 10, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 70, 71, 75, 86, 87, 89, 90, 92, 93, 94], "int64": 10, "int8": [80, 86], "integ": [2, 3, 9, 10, 43, 44, 47, 49, 50, 70, 90], "integr": [70, 75, 78, 85], "intellig": [13, 64], "intend": [4, 11, 55, 68, 81, 91], "intens": [8, 90], "intent": [12, 76], "interact": [2, 3, 4, 7, 10, 38, 54, 69, 70, 71, 85, 86], "interest": [27, 70, 71], "interfac": [9, 68, 69, 85, 91, 95], "intermit": 8, "intern": [2, 4, 9, 10, 11, 64, 79, 80], "internal_render_mod": 10, "internet": 86, "interpol": 8, "intersect": 46, "interv": 71, "introduc": [8, 13, 71], "introduct": 96, "introductori": 74, "invad": [8, 13, 72], "invalid": [2, 80, 90], "invis": [17, 20, 30], "invisible_invad": 30, "involv": [24, 51, 85], "io": [90, 91, 92, 93], "is_avail": [12, 71, 72, 73, 75, 76, 94, 97], "is_first": 4, "is_invis": 17, "is_last": [4, 10], "is_paralleliz": 70, "is_vector_env": 75, "isinst": [2, 11, 75, 94, 97], "isort": [70, 86], "issu": [2, 10, 11, 27, 40, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93, 94, 95, 97], "item": [12, 67, 72, 73, 75, 76, 86, 90], "item_1": 10, "item_2": 10, "iter": [9, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 71], "its": [8, 9, 10, 11, 25, 39, 40, 42, 45, 46, 47, 48, 49, 51, 54, 65, 71, 94], "itself": [9, 40, 66, 71, 87, 89, 90], "j": [8, 13, 40, 48, 66], "jab": 15, "jack": 48, "jacob975": 70, "jammf": 70, "jayesh": 64, "jean": 54, "jet": [7, 12, 16, 76], "jjshoot": [12, 70, 76], "joel": 13, "join": [70, 71, 72, 73, 75, 94, 97], "joint": 65, "jordan": 7, "joschu": [12, 75, 76], "journal": [8, 13, 42, 54], "joust": 13, "joust_v3": 24, "jump": [34, 35], "jun": [7, 13], "junyu": 42, "just": [8, 9, 10, 11, 40, 90], "k": [8, 13, 40, 45, 47, 48, 50, 51, 64, 66, 75], "kallinteri": 70, "kaz": 70, "kchour": 70, "keep": [8, 16, 25, 39, 54, 65, 67, 71, 78, 81, 90], "kei": [2, 3, 9, 15, 16, 17, 31, 39, 40, 41, 57, 66, 70, 72, 73, 75, 77, 90, 92, 93], "kept": 10, "kernel": [71, 72], "kernel_s": [71, 72], "kick": 25, "kill": [4, 40], "killable_arch": 40, "killable_knight": 40, "king": [43, 45, 48], "kingsid": 43, "kir0ul": 70, "kl": [12, 75, 76], "knee": 65, "knight": [2, 4, 13, 38, 43, 70, 91], "knight_0": 40, "knight_1": 40, "knights_archers_zombi": [10, 40, 70], "knights_archers_zombies_v0": 10, "knights_archers_zombies_v10": [9, 10, 38, 40, 69, 92], "knock": [25, 45], "knock_reward": 45, "know": [56, 71], "knowledg": 47, "known": [8, 27, 45, 59], "ko": 15, "kochenderf": 64, "komi": 46, "kw": 87, "kwarg": [4, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 87, 89, 90], "kwei": 42, "l": [40, 75], "laboratori": 64, "lai": 42, "laid": 78, "lambda": [11, 75, 86, 87, 89, 94, 95], "lambda_": 89, "landmark": [54, 55, 56, 57, 58, 59, 60, 61, 62, 63], "landmark_id": [58, 59], "landmark_rel_posit": [55, 56, 61, 62, 63], "langchain": 70, "languag": [54, 85], "laptop": [90, 92], "larg": [2, 62, 65, 67, 70, 96], "largest": [8, 47, 49, 90], "last": [2, 4, 6, 7, 8, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 86, 87, 89, 90, 92, 93], "last_opp_mov": 71, "lastgaelam": 75, "latest": [43, 71], "latest_polici": [90, 92, 93], "launch": [13, 38, 42, 54, 64, 90, 92, 93], "layer": [9, 12, 22, 71, 72, 73, 75, 76], "layer_init": 75, "layout": 43, "ldot": 46, "leadadversary_0": 63, "leader": 63, "leader_comm": 63, "leaderboard": 77, "leaf": 2, "learn": [2, 3, 5, 7, 8, 12, 13, 27, 38, 39, 41, 42, 56, 57, 58, 61, 64, 68, 69, 70, 72, 73, 74, 75, 76, 77, 88, 90, 91, 92, 93, 94, 96], "learn_step": [71, 72, 73], "learnabl": 70, "learner": [12, 76], "learning_r": [75, 93], "least": [10, 27, 47, 78, 96], "leav": [2, 13, 26, 30, 32], "leduc": [42, 70, 87, 90], "leduc_holdem": 48, "leduc_holdem_v4": [48, 87, 90], "leduoc": 87, "leela": [70, 88], "leelachesszero": 43, "left": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 46, 47, 54, 65, 66, 70, 71, 79, 80], "left_paddle_spe": [9, 39], "leftmost": 65, "leg": 65, "legal": [42, 71, 86], "legal_mov": 47, "len": [10, 12, 71, 72, 73, 76, 89, 92, 93, 94, 97], "length": [2, 3, 8, 9, 12, 46, 47, 65, 67, 71, 76, 94], "less": [13, 30, 71, 92], "lesson": 71, "lesson1_trained_ag": 71, "lesson2_trained_ag": 71, "lesson3_trained_ag": 71, "lesson4_trained_ag": 71, "lesson_numb": 71, "let": [33, 71, 91], "level": [9, 30, 32, 37, 61, 71, 81], "leverag": [92, 93], "librari": [9, 13, 42, 68, 70, 74, 77, 88, 91], "lidar": 65, "life": [20, 24, 25, 37, 47, 70], "lightweight": [9, 77, 96], "like": [2, 3, 8, 9, 10, 11, 12, 13, 17, 22, 39, 40, 43, 47, 54, 65, 68, 70, 71, 76, 86, 87, 89, 90], "limit": [2, 4, 42, 48, 67, 70], "line": [10, 12, 40, 52, 67, 70, 71, 76, 79, 80, 91, 96], "line_death": 40, "linear": [8, 12, 75, 76, 89], "linear_interp": 8, "linearli": 8, "link": [68, 70], "lint": 70, "linux": 9, "list": [2, 3, 4, 9, 10, 12, 43, 44, 45, 46, 47, 48, 50, 51, 52, 70, 71, 72, 73, 76, 90, 94, 97], "listen": [54, 59, 73, 74], "listener_0": 60, "liter": 32, "littl": 39, "live": [3, 6, 10, 25, 30, 37, 70], "lizard": [49, 70], "load": [7, 70, 71, 72, 73, 87, 89, 90, 92, 93, 94, 95], "load_state_dict": [71, 94], "loadcheckpoint": [71, 72, 73], "local": [41, 59, 61, 67, 70], "local_dir": 89, "local_ratio": [41, 59, 61, 65, 67, 70], "local_reward": 41, "locat": [21, 27, 44, 46, 63, 67, 71, 81], "locomot": 7, "log": [4, 12, 70, 71, 75, 76, 87, 96, 97], "log_level": [87, 89], "log_path": 94, "log_prob": [12, 75, 76], "logdir": 94, "logger": [4, 10, 94], "logic": [5, 6, 10, 12, 47, 70, 75, 76, 78, 83], "logical_and": 71, "logit": [12, 75, 76, 87], "logo": 70, "logprob": [12, 75, 76], "logratio": [12, 75, 76], "long": [11, 12, 15, 27, 32, 75, 76, 85, 90], "longer": [8, 10, 14, 18, 20, 22, 27, 28, 29, 33, 34, 35, 40, 41, 70, 92], "longest": [19, 39, 90], "look": [2, 9, 10, 11, 13, 26, 40, 70, 71], "loop": [2, 68, 70, 72, 73, 89], "lose": [4, 6, 19, 20, 24, 25, 26, 37, 42, 45, 47, 71, 86], "loser": [43, 45, 46, 48, 49, 50, 51, 52], "loss": [12, 42, 47, 75, 76, 90], "loss_avoiding_act": 71, "lost": [47, 67], "lot": 85, "low": [8, 54, 71, 72, 73, 87], "lowe2017multi": 54, "lower": [9, 40, 41], "lower_bound": [8, 72, 75], "lowest": 47, "lr": [12, 71, 72, 73, 75, 76, 89, 94, 97], "lr_actor": [72, 73], "lr_critic": [72, 73], "lrnow": 75, "lru_cach": [10, 79, 80], "lst": 71, "lurk": [19, 20], "m": [1, 13, 40, 51, 71, 90, 92, 93], "mace": 40, "machado": [8, 13], "machado2018revisit": 13, "machin": 68, "maco": [9, 70], "maddpg": [70, 74], "maddpg_trained_ag": 72, "made": [1, 4, 44, 64, 65, 68, 70, 86], "madrl": [8, 64], "magent": 70, "magent2": [2, 70], "magnitud": [8, 67], "mahjong": 70, "mai": [2, 3, 9, 10, 43, 46, 67, 68, 71, 90], "main": [3, 25, 26, 43, 44, 45, 46, 47, 48, 50, 51, 52, 56, 85, 86], "maintain": [43, 68, 70], "major": [64, 67, 68, 70], "make": [1, 2, 4, 6, 8, 9, 11, 20, 27, 30, 39, 40, 41, 43, 44, 45, 46, 47, 49, 52, 54, 65, 66, 67, 70, 71, 74, 81, 85], "makedir": [71, 72, 73, 97], "man": 36, "manag": [4, 71, 85], "maneuv": 23, "mani": [2, 4, 8, 11, 40, 42, 68, 70, 71, 77, 80, 86, 90], "manner": [6, 54], "manu": 70, "manual": [2, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 67, 70], "manual_control": 70, "manual_polici": [38, 70], "manual_se": [75, 94, 97], "manualpolici": 38, "map": [10, 16, 17, 20, 21, 26, 27, 31, 47, 54, 66, 70, 71], "marc": 13, "mario": 13, "mario_bro": 25, "mario_bros_v3": 25, "maritim": 68, "mark": [2, 7, 52, 90], "markdown": [1, 70], "markov": 71, "markovvectorenv": 92, "marl": [2, 8, 69, 94, 97], "marlo": 13, "mask": [8, 10, 42, 70, 71, 83, 87, 91], "mask_fn": 90, "maskabl": 90, "maskableactorcriticpolici": 90, "maskableppo": 90, "mass": 41, "massiv": [68, 70], "master": [32, 70, 71, 75, 90, 92, 93], "mat": 70, "match": [4, 10, 33, 68, 70, 87, 94], "matd3": [70, 74], "matd3_trained_ag": 73, "materi": [43, 70], "matrix": [7, 40], "matter": [9, 11], "matthew": 13, "max": [8, 12, 13, 47, 70, 71, 72, 73, 75, 76, 90, 92, 93], "max_act": [71, 72, 73], "max_arrow": 40, "max_batch_s": [71, 72], "max_cycl": [9, 11, 12, 13, 39, 40, 41, 49, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70, 76, 86, 89, 92], "max_cycles_test": 11, "max_episod": [4, 71, 72, 73], "max_epoch": 97, "max_fram": 70, "max_grad_norm": 75, "max_information_token": 47, "max_it": 9, "max_learn_step": [71, 72], "max_length": 71, "max_life_token": 47, "max_lr": [71, 72], "max_num_ag": [2, 3, 9], "max_observation_v0": [8, 13, 75], "max_reward": 39, "max_skip": 8, "max_step": [4, 71, 72, 73], "max_train_episod": 71, "max_zombi": [40, 92], "maxandskip": [8, 13], "maxim": [13, 27, 30, 64, 86], "maximis": 71, "maximum": [8, 13, 40, 47, 65, 67, 70, 71, 72, 73, 75], "maxlen": [71, 86], "maxpool2d": [12, 76], "maxsiz": [10, 79, 80], "maze": [13, 17, 19, 20], "maze_craz": 26, "maze_craze_v3": 26, "mb_advantag": 75, "mb_ind": 75, "mclean": 70, "md": [1, 70, 78], "mean": [9, 10, 12, 14, 18, 20, 22, 27, 28, 29, 33, 34, 35, 37, 40, 41, 44, 49, 54, 56, 65, 66, 70, 71, 72, 73, 75, 76, 78, 94], "mean_fit": 71, "mean_reward": [94, 97], "mean_scor": 71, "mean_turn": 71, "mean_turns_per_gam": 71, "mechan": 8, "medium_env": 90, "meet": 70, "meltingpot": 68, "meltingpot_compat": 7, "meltingpotcompatibilityv0": 7, "mem_ful": 71, "member": 71, "memoiz": [10, 79, 80], "memor": 13, "memori": [8, 21, 26, 71, 72, 73], "memory_s": [71, 72, 73], "mental": 2, "merg": [49, 70], "messag": [4, 9, 11, 54, 57, 70], "message_histori": 86, "metadata": [10, 70, 71, 78, 79, 80, 90, 92, 93], "method": [3, 8, 9, 10, 11, 39, 43, 54, 65, 70, 71, 79, 80, 90], "metric": 85, "mgoulao": 70, "michael": [13, 72, 73], "microwrapp": 8, "middl": 79, "might": 71, "mikcnt": 70, "mikepratt1": [70, 72, 73], "million": 75, "mimwrit": [71, 72, 73], "min": [62, 71], "min_act": [71, 72, 73], "min_batch_s": [71, 72], "min_learn_step": [71, 72], "min_lr": [71, 72], "min_skip": 8, "mind": 54, "mini": 75, "miniatur": 68, "minibatch": 75, "minibatch_s": 75, "minigo": 46, "minim": [15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 37, 47, 70, 78, 95, 97], "minimap": 70, "minimum": [8, 50, 51, 61, 63, 67, 71, 90], "minor": [40, 41, 54, 70], "minut": [15, 90, 92, 93], "mirror": 75, "misc": [39, 40, 41, 65, 66, 67, 70], "miscellan": 70, "missil": 16, "mistak": 71, "mistakenli": 70, "misus": 70, "mix": [24, 25, 54], "mixtur": 54, "ml": [68, 70, 88, 94, 95, 97], "mlp": [71, 72, 73, 90, 91, 93], "mlppolici": [92, 93], "mode": [2, 3, 6, 8, 9, 10, 11, 16, 17, 26, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 65, 66, 67, 70, 72, 75, 89, 92], "model": [2, 9, 72, 73, 74, 85, 86, 87, 89, 90, 91, 92, 93, 94, 97], "model_config": 87, "model_out": 89, "model_save_path": [94, 97], "modelcatalog": [87, 89], "modern": [13, 68], "modifi": [71, 75], "modul": [9, 12, 70, 75, 76, 89, 90, 92, 93], "modular": [77, 81, 96], "momentum": [31, 41], "monitor_gym": 75, "month": 13, "mordatch": 54, "mordatch2017emerg": 54, "more": [1, 2, 3, 7, 9, 10, 25, 27, 30, 31, 37, 39, 45, 46, 47, 49, 54, 61, 68, 70, 71, 74, 77, 78, 80, 87, 88, 89, 90, 91, 92, 93], "most": [6, 8, 9, 10, 13, 27, 42, 49, 54, 70, 71, 90], "mostli": [42, 54], "motion": [35, 54], "move": [4, 6, 9, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 54, 60, 66, 67, 70, 71, 79, 80, 86, 90], "move_down": [56, 58, 59, 60, 61, 62, 63], "move_left": [56, 58, 59, 60, 61, 62, 63], "move_right": [56, 58, 59, 60, 61, 62, 63], "move_up": [56, 58, 59, 60, 61, 62, 63], "moveaxi": [71, 72, 73], "movement": [16, 41, 54, 80], "moving_shield": 30, "mpe": [55, 56, 57, 58, 59, 60, 61, 62, 63, 70, 71, 72, 73], "mpe_environ": 70, "mqueue": 4, "much": [8, 30, 41, 70, 71, 90], "multi": [2, 3, 9, 13, 54, 64, 68, 69, 70, 72, 73, 74, 86, 88, 91, 96], "multi_ag": 87, "multi_agent_replay_buff": [72, 73], "multiag": [3, 55, 64, 68], "multiagentenv": 70, "multiagentpolicymanag": [94, 95, 97], "multiagentreplaybuff": [72, 73], "multibinari": 2, "multidiscret": [2, 79, 80], "multipl": [2, 34, 67, 68, 70, 74, 86], "multiplay": [13, 68], "multipli": [65, 67], "multithread": [92, 93], "multiwalk": [64, 70], "multiwalker_v9": [6, 65], "murtazarang": 70, "must": [2, 3, 6, 9, 10, 14, 22, 23, 27, 28, 29, 32, 34, 35, 39, 40, 41, 43, 44, 46, 47, 49, 52, 54, 57, 58, 60, 61, 65, 66, 67, 71, 79, 80, 90], "mutat": [71, 72, 73], "mutation_sd": [71, 72, 73], "mutual": 2, "mykel": 64, "m\u016b": 68, "n": [2, 4, 8, 9, 12, 40, 43, 46, 49, 56, 61, 71, 72, 73, 75, 76, 79, 80, 87, 90, 94, 97], "n_agent": [72, 73], "n_catch": 66, "n_coop": 67, "n_cycl": 70, "n_episod": [94, 95], "n_evad": [66, 67], "n_obstacl": 67, "n_piston": [41, 89], "n_poison": 67, "n_pursuer": [66, 67], "n_sensor": 67, "n_step": [71, 94, 97], "n_walker": 65, "naddaf": 13, "name": [2, 3, 4, 8, 9, 10, 39, 40, 41, 43, 44, 46, 47, 49, 52, 65, 66, 67, 70, 71, 75, 78, 79, 80, 86, 87, 89, 90, 92, 93], "namespac": 94, "nan": [4, 8, 12, 70, 75, 76], "nan_noop_v0": 8, "nan_random_v0": 8, "nan_zeros_v0": 8, "narg": [75, 94], "narrow": 21, "natur": [2, 54, 80], "navig": [19, 20, 60, 67], "ncp": 37, "ndarrai": [2, 3, 47], "ne": 43, "necessari": [8, 10, 71, 72, 73, 79, 80], "necessarili": 10, "need": [1, 4, 9, 10, 11, 19, 20, 21, 27, 31, 67, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93, 94, 95, 97], "neg": [39, 45, 56, 62, 67, 71, 90], "negat": 47, "neighbor": [65, 67], "neighbour": 65, "nest": 2, "net": [12, 35, 75, 76, 94, 97], "net_config": [71, 72, 73], "network": [2, 8, 10, 12, 39, 40, 41, 43, 44, 46, 47, 49, 52, 65, 66, 67, 71, 72, 73, 75, 76, 87, 94, 97], "neural": [8, 43, 54, 71], "never": [9, 45, 70], "nevertheless": 43, "new": [4, 5, 9, 10, 11, 25, 26, 27, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 68, 70, 71, 72, 73, 83, 85, 90], "new_height": 71, "new_layer_prob": [71, 72, 73], "new_width": 71, "newli": [71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "newlogprob": [12, 75, 76], "newvalu": 75, "next": [2, 4, 6, 9, 10, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70, 71, 72, 73, 90, 91], "next_ag": 90, "next_don": 75, "next_ob": [12, 75, 76], "next_stat": [71, 72, 73], "next_termin": 75, "next_trunc": 75, "next_valu": 75, "nextnontermin": 75, "nextvalu": 75, "nhvkkya6qx": 70, "nick": [71, 72], "nicku": [70, 71, 72, 73], "nickua": 73, "nip": 54, "nn": [12, 75, 76, 87, 89], "no_act": [56, 58, 59, 60, 61, 62, 63], "no_grad": [12, 71, 75, 76], "no_mov": 10, "no_mut": [71, 72, 73], "no_op_act": 8, "node": 2, "nois": 65, "noisi": 65, "non": [11, 13, 38, 40, 42, 46, 70, 71, 91], "non_zero": 71, "none": [2, 3, 4, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 75, 76, 78, 79, 80, 86, 87, 89, 90, 92, 93, 94, 97], "noop": 8, "noqa": [75, 86], "norm": [67, 75], "norm_adv": 75, "normal": [8, 11, 12, 30, 33, 40, 63, 65, 71, 72, 75, 76], "normalize_obs_v0": [8, 89], "notabl": [13, 70], "notat": 43, "note": [2, 4, 6, 8, 9, 10, 17, 19, 20, 25, 26, 27, 34, 37, 40, 42, 43, 45, 54, 63, 64, 66, 68, 71, 75, 79, 80, 81, 90, 91, 92, 93], "noth": [27, 34, 40, 54, 86], "notori": 85, "novel": 7, "now": [10, 40, 68, 70, 71, 72, 73, 79, 81, 86], "np": [8, 10, 12, 62, 71, 72, 73, 75, 76, 79, 80, 87, 94, 97], "npc": [24, 37], "nstart": [92, 93], "nth": [2, 9, 46], "num": [75, 94], "num_act": [12, 49, 76], "num_adversari": [62, 63], "num_ag": [2, 3, 6, 9, 12, 72, 73, 76], "num_arch": 40, "num_atom": 71, "num_col": 71, "num_cpu": [75, 92, 93], "num_cycl": [11, 70, 81], "num_env": 75, "num_food": 63, "num_forest": 63, "num_fram": 8, "num_gam": [90, 92, 93], "num_good": [62, 63], "num_gpu": [87, 89], "num_it": 10, "num_knight": 40, "num_minibatch": 75, "num_mov": 10, "num_obstacl": [62, 63], "num_output": [87, 89], "num_play": [14, 22, 28, 35, 50, 51, 70, 86], "num_rollout_work": [87, 89], "num_row": 71, "num_sgd_it": 89, "num_step": [12, 75, 76], "num_sword": 40, "num_upd": 75, "number": [2, 4, 6, 8, 10, 11, 12, 13, 14, 15, 22, 26, 27, 28, 30, 32, 33, 35, 40, 41, 43, 46, 47, 48, 49, 50, 51, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70, 71, 72, 73, 75, 76, 90, 92, 96], "numer": [40, 70], "numpi": [2, 3, 8, 9, 10, 12, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 87, 94, 97], "nw": 43, "o": [4, 40, 52, 71, 72, 73, 75, 86, 87, 89, 90, 92, 93, 94, 97], "ob": [12, 70, 75, 76, 86, 87, 89, 90, 92, 93], "object": [4, 39, 41, 45, 67, 71, 72, 73], "obs_buff": 86, "obs_len": 87, "obs_messag": 86, "obs_rang": 66, "obs_spac": [87, 89], "obs_typ": 13, "obsdict": 70, "observ": [2, 3, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 66, 68, 69, 70, 71, 72, 73, 76, 79, 80, 85, 86, 87, 89, 90, 91, 92, 93, 94, 97], "observation_s": [12, 76], "observation_spac": [2, 3, 9, 10, 12, 39, 40, 41, 43, 44, 46, 47, 49, 52, 65, 66, 67, 70, 71, 72, 73, 75, 76, 78, 79, 80, 87, 90, 94, 97], "observation_typ": 47, "observation_vector_dim": 47, "obsolet": 10, "obstacl": [17, 32, 54, 62, 63, 66, 67], "obstacle_coord": 67, "obstacle_radiu": 67, "obstyp": [2, 3, 6], "occasion": 39, "occupi": 43, "occur": 86, "odd": [49, 70], "off": [11, 13, 17, 25, 39, 41, 65, 67, 75, 91], "off_screen_penalti": 39, "offens": 23, "offer": 74, "offici": [9, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 70, 77], "offlin": 71, "offpolicy_train": [94, 97], "often": [2, 10, 13, 54], "old": [8, 10, 12, 26, 71, 76], "old_approx_kl": [12, 75, 76], "oldest": [43, 71], "olymp": [14, 22, 28, 29, 35], "onc": [1, 2, 3, 18, 32, 42, 70, 71], "one": [2, 6, 8, 9, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 56, 60, 68, 70, 71], "one_hot": [71, 72, 73], "ones": [10, 43, 80], "onli": [2, 3, 6, 10, 11, 13, 17, 18, 19, 20, 26, 30, 40, 42, 45, 47, 49, 54, 59, 65, 70, 71, 75, 90, 91, 96], "onlin": 68, "onto": [25, 35], "open": [8, 10, 13, 17, 68, 71, 77, 88], "openai": [8, 13, 54, 86], "openscenario": 68, "openspiel": [2, 47, 70], "openspiel_compat": 7, "openspielcompat": 70, "openspielcompatibilityv0": 7, "oper": [8, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 74], "opp": 71, "opp_three_count": 71, "opp_three_in_row": 71, "opp_update_count": 71, "oppon": [14, 15, 16, 17, 19, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 44, 45, 46, 48, 49, 66, 71, 94], "opponent_difficulti": 71, "opponent_first": 71, "opponent_path": 94, "opponent_pool": 71, "opponent_pool_s": 71, "opponent_upd": 71, "opponent_upgrad": 71, "opponents_hand_vis": 45, "opportun": [25, 37, 71], "oppos": [2, 54], "opposit": [20, 71], "optim": [12, 20, 38, 41, 65, 66, 71, 75, 76, 85, 89, 90, 92, 93, 94, 97], "optimis": [71, 72, 73, 74], "option": [2, 3, 10, 11, 13, 30, 39, 40, 41, 43, 44, 45, 46, 47, 49, 52, 54, 65, 66, 67, 70, 71, 79, 80, 90, 94, 97], "orang": 66, "orchestr": 74, "order": [2, 4, 6, 21, 27, 40, 45, 47, 49, 70, 85, 90, 92], "orderenforcingwrapp": [6, 10], "ordinari": 47, "org": [10, 79, 80, 90], "organ": 64, "orient": [43, 54, 65], "orig_obs_spac": 87, "origin": [4, 6, 8, 13, 43, 54, 64, 70], "orthogonal_": [12, 75, 76], "othello": 13, "othello_v3": 27, "other": [2, 5, 6, 8, 9, 10, 11, 13, 20, 22, 25, 26, 29, 30, 32, 35, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 56, 59, 60, 61, 63, 65, 66, 67, 70, 71, 74, 85], "other_agent_rel_posit": [56, 58, 61, 62, 63], "other_agent_veloc": [62, 63], "other_agents_rel_posit": 56, "otherwis": [6, 21, 39, 43, 47, 90], "our": [1, 2, 6, 9, 10, 12, 13, 43, 45, 46, 48, 51, 70, 71, 76, 81, 83], "out": [4, 6, 11, 12, 15, 32, 39, 54, 68, 70, 71, 72, 73, 74, 75, 76, 78, 89, 90], "outcom": [71, 86], "outperform": 90, "output": [4, 5, 6, 8, 10, 11, 54, 70, 87], "output_kei": 86, "output_pars": 86, "outsid": [2, 3, 4, 6, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 65, 66, 67, 70, 78], "over": [2, 4, 8, 10, 13, 25, 27, 34, 37, 39, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 57, 67, 70, 71, 79, 80, 85, 87], "overal": 41, "overestim": 73, "overhaul": 70, "overhead": 9, "overridden": [10, 79, 80], "overview": 10, "overwrit": [79, 80], "own": [11, 12, 21, 27, 39, 40, 46, 47, 54, 69, 71, 76, 78], "p": [71, 79, 80], "p0_action": 71, "p0_action_mask": 71, "p0_next_stat": 71, "p0_next_state_flip": 71, "p0_state": 71, "p0_state_flip": 71, "p1_action": 71, "p1_action_mask": 71, "p1_next_stat": 71, "p1_next_state_flip": 71, "p1_state": 71, "p1_state_flip": 71, "pa_model": 87, "packag": [1, 7, 8, 10, 65, 70, 71, 78, 94, 95, 97], "pad": [8, 12, 40, 43, 71, 76], "pad_action_space_v0": 8, "pad_observ": 40, "pad_observations_v0": 8, "paddl": [22, 29, 39], "paddle_0": 39, "paddle_1": 39, "page": [13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 70], "pair": 49, "paper": [2, 3, 10, 43, 64, 66, 70, 75, 88, 90, 95], "par_env": 6, "paradigm": [3, 70], "parallel": [2, 5, 8, 12, 43, 44, 45, 46, 47, 48, 50, 51, 52, 69, 70, 72, 73, 74, 75, 76, 78, 83, 88, 89, 93], "parallel_api_test": [3, 11, 70, 81], "parallel_env": [3, 6, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 72, 73, 75, 76, 89, 92, 93], "parallel_env_fn": 11, "parallel_rp": 10, "parallel_seed_test": [11, 70], "parallel_test": 70, "parallel_to_aec": [6, 10, 70, 79, 80], "parallel_to_aec_wrapp": 6, "parallel_wrapper_fn": 70, "parallelenv": [6, 10, 78, 79, 80], "parallelpettingzooenv": 89, "param": [12, 71, 75, 76], "param_group": 75, "paramet": [6, 8, 9, 12, 41, 47, 59, 61, 67, 70, 71, 72, 73, 74, 75, 76, 88, 91, 94, 97], "parametr": 90, "parametricactionsmodel": 87, "pariti": 49, "parrellenv": 70, "pars": [8, 86, 94], "parse_arg": [75, 87, 89], "parse_known_arg": 94, "parser": [75, 87, 89, 94], "part": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 70, 71, 79, 88], "parti": 70, "partial": [2, 3, 11, 68, 70], "particl": [54, 73, 74], "particular": [6, 9, 10, 20, 26, 40, 63, 70], "pass": [4, 8, 9, 10, 11, 22, 23, 26, 40, 46, 70, 78], "passant": [43, 70], "past": [22, 23, 28, 33, 47, 70], "path": [2, 13, 16, 32, 40, 70, 71, 72, 73, 75, 81, 87, 89, 90, 92, 93, 94, 97], "pattern": 8, "pawn": [43, 80], "pbar": 71, "peculiar": 8, "penal": [15, 16, 17, 21, 31, 45, 61, 62, 67, 90], "penalti": [39, 45, 65, 70], "penni": 68, "peopl": 71, "pep": 70, "per": [2, 8, 13, 18, 24, 47, 67, 71, 75, 92, 94], "perfectli": [46, 54], "perform": [8, 47, 54, 70, 71, 72, 73, 74, 75, 77, 90, 91, 94], "performance_benchmark": 11, "permiss": 70, "permit": 70, "permut": [75, 89], "persist": 85, "perspect": [70, 71], "pest": 25, "pettingzoo": [2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 71, 72, 73, 75, 76, 78, 79, 80, 81, 83, 85, 87, 89, 91, 92, 93, 94, 95, 97], "pettingzoo_ag": 86, "pettingzoo_env": [87, 89, 94, 97], "pettingzoo_env_to_vec_env_v1": [75, 92, 93], "pettingzooag": 86, "pettingzooenv": [87, 89, 94, 95, 97], "pg_loss": [12, 75, 76], "pg_loss1": [12, 75, 76], "pg_loss2": [12, 75, 76], "philosophi": 2, "physic": [11, 31, 41, 65, 68, 70], "pi": 65, "pick": [43, 45], "pickl": 70, "piec": [27, 34, 43, 46, 70, 71, 85], "pieter": 54, "pil": [71, 72, 73, 89], "pile": [45, 47], "pillow": [70, 71, 72, 73, 87, 89], "pimpal": 70, "pip": [1, 7, 8, 9, 10, 13, 38, 42, 54, 64, 70], "piston": [41, 70], "piston_0": 41, "piston_1": 41, "piston_19": 41, "pistonbal": [3, 12, 38, 70, 76, 77, 87, 88], "pistonball_v6": [3, 4, 6, 9, 10, 11, 12, 38, 41, 76, 87, 89], "pixel": [13, 39, 40, 41, 54, 70], "place": [8, 9, 10, 27, 44, 46, 47, 52, 54, 65, 66, 71, 79], "placehold": [71, 72, 73], "placement": [44, 52], "plagu": 8, "plai": [2, 3, 9, 10, 18, 25, 32, 39, 43, 47, 49, 52, 68, 70, 74, 79, 90, 92, 93, 94, 95, 97], "plain": 8, "plan": [25, 26, 32], "plane": [13, 43, 44, 45, 46, 52], "platform": [13, 96], "play_continu": 71, "playabl": 68, "player": [2, 4, 6, 10, 13, 14, 15, 16, 17, 18, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 68, 70, 71, 75, 79, 86, 91, 94], "player1": 4, "player2": 4, "player_": 10, "player_0": [43, 44, 45, 47, 48, 49, 50, 51, 71, 87], "player_1": [43, 44, 45, 47, 48, 49, 50, 51, 52, 71, 87], "player_2": 52, "player_idx": 75, "pleas": [7, 8, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 70, 71, 72, 73, 75, 76, 78, 86, 87, 89, 90, 92, 93, 94, 95, 97], "plot": 75, "plu": [27, 41, 50, 67], "plugin": 1, "point": [9, 14, 15, 16, 17, 18, 21, 22, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 40, 44, 45, 46, 47, 79, 80, 83, 92], "poison": 67, "poison_reward": 67, "poison_spe": 67, "poker": [51, 70, 88], "polici": [2, 3, 4, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 72, 73, 75, 76, 87, 89, 90, 91, 92, 93, 94, 95, 97], "policy_fn": 89, "policy_freq": 73, "policy_loss": 75, "policy_mapping_fn": 87, "pong": [13, 38, 70], "pong_v3": [28, 75], "pool": 71, "poor": [27, 90], "poorli": 90, "pop": [71, 72, 73], "popul": [54, 71, 72, 73], "popular": [8, 42, 68, 88], "population_s": [71, 72, 73], "pose": 8, "posg": [2, 3, 70], "posit": [16, 17, 24, 31, 33, 40, 41, 43, 47, 52, 54, 55, 56, 63, 65, 67, 70, 71, 90, 93], "position_nois": 65, "possibl": [2, 4, 8, 9, 10, 11, 13, 20, 26, 30, 32, 39, 40, 43, 47, 49, 52, 54, 70, 71], "possible_ag": [2, 3, 9, 10, 12, 70, 76, 79, 80, 86, 87, 89, 90, 92, 93], "post": 91, "pot": 51, "potenti": [2, 17, 25, 70], "power": [15, 19, 20, 85], "powerup": 20, "ppo": [12, 68, 77, 87, 88, 91], "ppo_mask": 90, "ppo_pettingzoo_ma_atari": 75, "ppo_pettingzoo_ma_ataripi": 75, "ppo_pistonball_v6_660ce_00000_0_2021": [87, 89], "ppoagent": 89, "ppoconfig": 89, "pr": [9, 70], "practic": [71, 81], "pragmat": 71, "pre": [5, 8, 70, 71, 72, 91, 92, 94], "precis": [13, 15, 18], "predat": 62, "predefin": 8, "predict": [17, 31, 33, 87, 90, 92, 93], "prefer": 8, "prei": 62, "prematur": [19, 20, 24, 25, 26, 36, 37, 40, 65], "prepend": 40, "preprint": [8, 13, 42, 54], "preprocess": 88, "present": 4, "press": [34, 40], "pretrain": [71, 87, 89], "pretrained_path": 71, "pretti": [10, 79, 80], "prevent": [8, 14, 18, 22, 27, 28, 29, 33, 34, 35, 63, 80], "previou": [10, 13, 43, 47, 65, 70, 71, 72, 73, 80], "primarili": 55, "print": [2, 3, 4, 6, 9, 10, 11, 12, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93, 94, 97], "prior": 8, "prior_ep": 71, "priorit": 71, "prioriti": 71, "prison": [7, 68, 70, 79, 80], "prisoner_act": [79, 80], "prisoner_action_mask": 80, "prisoner_i": [79, 80], "prisoner_x": [79, 80], "prisoners_dilemma_in_the_matrix__arena": 7, "privat": 57, "private_kei": 57, "prob": [12, 75, 76], "probabl": [2, 8, 9, 71, 72, 73, 87, 89], "probit": 87, "problem": [8, 13, 65, 68, 69, 70, 71], "problemat": 9, "process": [5, 8, 13, 25, 54, 70, 71, 72, 73, 78, 83, 91, 92], "produc": [11, 13, 67, 91], "product": [59, 63], "profici": 43, "program": 2, "progress": [2, 3, 9, 71], "project": [70, 71, 75, 83], "promot": 43, "proper": [43, 46, 70, 79, 80], "properli": [11, 90], "properti": 65, "proport": [41, 66, 67], "propos": 70, "prospector": 70, "protect": 30, "protocol": [8, 13], "provid": [2, 3, 4, 5, 6, 10, 40, 41, 70, 71, 74, 77, 85, 86, 87, 89, 91, 92, 96, 97], "proxim": [89, 90, 92, 93], "prune": 66, "pseudo": 70, "pt": [71, 72, 73], "pth": [94, 97], "public": [48, 57, 77], "publish": 70, "puck": 23, "pull": 70, "punch": 15, "punish": 54, "pure": [14, 18, 22, 27, 28, 29, 33, 34, 35, 96], "purpl": 67, "purpos": [55, 75, 91], "pursu": 67, "pursuer": [66, 67, 70], "pursuer_0": [66, 67], "pursuer_1": [66, 67], "pursuer_4": 67, "pursuer_7": 66, "pursuer_max_accel": 67, "pursuer_spe": 67, "pursuit": [64, 70], "pursuit_v4": 66, "push": 54, "put": [10, 17], "py": [1, 10, 38, 70, 75, 78, 79, 80, 81, 90], "pybullet": 68, "pydocstyl": 70, "pygam": [38, 40, 41, 68, 70], "pyglet": 70, "pymunk": [40, 41, 70, 93], "pypi": 70, "pyproject": 70, "pyright": 70, "pytest": [1, 70, 90], "python": [1, 9, 43, 69, 70, 88, 94, 95, 96, 97], "python_vers": [71, 72, 73], "pytorch": [71, 72, 87, 91, 96], "pyyaml": [71, 72, 73], "pz": [12, 76], "q": [40, 48, 71, 87, 94, 97], "qmix": [3, 39, 65], "qol": 70, "quadrapong": [13, 70], "quadrapong_v4": 29, "qualiti": [65, 70, 77, 96], "queen": [43, 48], "queensid": 43, "question": [70, 71, 72, 73, 75, 76, 85, 86, 87, 89, 90, 92, 93, 94, 95, 97], "quickli": [19, 20, 21, 25], "quot": 70, "r": [1, 8, 10, 71, 72, 73, 75, 86], "race": [2, 19, 26, 68], "radiu": 67, "raffaelegalliera": 70, "rai": [70, 87, 89], "rainbow": 71, "rais": [6, 10, 41, 48, 50, 51, 79, 80], "ram": 13, "rand_se": [71, 72, 73], "randint": [79, 80], "random": [2, 4, 8, 11, 12, 13, 38, 39, 41, 42, 47, 54, 64, 67, 70, 71, 74, 75, 76, 79, 80, 86, 90, 92, 93, 94, 95, 96, 97], "random_act": 86, "random_demo": 70, "random_drop": [41, 89], "random_oppon": 71, "random_rot": [41, 89], "random_start_play": 47, "randomli": [8, 26, 54, 57, 66, 71, 79], "randompolici": [94, 95, 97], "rang": [8, 10, 12, 41, 47, 67, 71, 72, 73, 75, 76, 90, 92, 93, 94, 97], "rank": [43, 45, 47], "rapid": 23, "rare": [19, 20], "rate": [40, 71, 72, 73, 75, 94], "rather": [2, 8, 9, 70, 92, 93], "ratio": [12, 41, 70, 75, 76], "raw": [70, 90], "raw_env": [9, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67], "ray_result": [87, 89], "rb_action": [12, 76], "rb_advantag": [12, 76], "rb_logprob": [12, 76], "rb_ob": [12, 76], "rb_return": [12, 76], "rb_reward": [12, 76], "rb_term": [12, 76], "rb_valu": [12, 76], "re": [13, 70, 90], "reach": [4, 12, 40, 44, 68, 70, 76], "reaction": 8, "read": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70], "readabl": 70, "readi": [71, 72, 73, 78], "readm": [70, 78], "readthedoc": [90, 92, 93], "real": [41, 68, 86], "realist": 41, "reappli": 8, "reason": [9, 10, 11, 54, 71, 90], "rebuild": 1, "recast": 8, "receiv": [2, 3, 4, 9, 14, 20, 22, 26, 27, 28, 29, 30, 33, 35, 36, 39, 45, 47, 48, 49, 51, 52, 54, 62, 65, 66, 67, 86], "recent": [8, 10, 68, 70, 71], "reciproc": 7, "recommend": [8, 10, 13, 71, 72, 73, 75, 76, 81, 83, 86, 87, 89, 90, 92, 93, 94, 95, 97], "reconstruct": [54, 57], "record": [72, 73, 75], "recordvideo": 75, "red": [47, 54, 56, 62, 66, 67], "redesign": [39, 70], "redid": 70, "redtachyon": 70, "reduc": [10, 70, 73, 79, 80, 92], "reduct": [5, 92], "ref": 70, "refactor": [41, 67, 70], "refer": [12, 45, 48, 51, 54, 65, 67, 69, 70, 71, 76, 85, 90], "reflect": 70, "regardless": 47, "regex": 86, "regexpars": 86, "reginald": 70, "region": [8, 40], "regist": [27, 34, 87], "register_custom_model": [87, 89], "register_env": [87, 89], "registri": [87, 89], "regress": 11, "regular": [51, 71], "reinforc": [2, 3, 5, 7, 8, 13, 42, 64, 68, 69, 71, 74, 77, 88, 91, 96], "reinit": [4, 71], "reiniti": 4, "rel": [12, 27, 40, 43, 54, 59, 61, 63, 65, 76, 81], "relat": [9, 40, 54, 70], "releas": [2, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 64, 65, 66, 67, 68], "relev": [10, 40], "reli": 90, "reliabl": [30, 70, 91], "relu": [12, 75, 76, 89], "remain": [6, 39, 47, 71, 90], "remov": [2, 3, 8, 9, 10, 13, 40, 45, 47, 65, 66, 70, 71, 79, 80, 90, 92], "remove_on_fal": 65, "renam": 70, "render": [2, 3, 4, 6, 7, 9, 10, 12, 13, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70, 71, 72, 73, 76, 78, 79, 80, 87, 89, 90, 92, 93, 94, 95], "render_fp": 70, "render_mod": [2, 3, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 76, 86, 89, 90, 92, 93, 94, 95], "render_result": 11, "render_test": [11, 70], "repeat": [12, 27, 47, 76, 85], "repeat_action_prob": [8, 13], "repeatedli": 71, "repetit": [43, 70], "repl": 86, "replac": [13, 43, 44, 45, 46, 47, 48, 50, 51, 52, 65, 70, 86], "replai": [71, 72, 73], "replay_buff": 71, "replaybuff": 71, "repo": [70, 74, 86], "report": [67, 70], "repositori": [75, 79], "repres": [2, 8, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 65, 67, 69, 71], "represen": 70, "reproduc": [11, 86], "request": 8, "requir": [1, 2, 8, 9, 10, 11, 20, 25, 38, 49, 66, 70, 71, 78, 79, 80, 87, 89, 90, 92, 94, 95, 97], "rescal": [55, 56, 57, 58, 59, 60, 61, 62, 63], "rese": 9, "research": [7, 8, 13, 42, 45, 48, 51, 54, 71, 77], "resembl": 2, "reset": [2, 3, 4, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 75, 76, 78, 79, 80, 86, 87, 89, 90, 92, 93], "reshap": [8, 71, 75], "reshape_v0": 8, "resiz": [71, 91, 92], "resize_fram": 71, "resize_v1": [8, 12, 13, 72, 75, 76, 89, 92], "resized_fram": 71, "resolut": [2, 68], "resolv": 70, "resourc": [2, 39, 40, 41, 43, 44, 46, 47, 49, 52, 65, 66, 67, 71, 87, 89], "respect": [38, 40, 43, 44, 45, 46, 48, 59, 67, 70], "respond": 86, "respons": 15, "rest": 65, "restrict": [2, 3, 13], "result": [2, 8, 10, 11, 40, 54, 64, 67, 70, 71, 75, 90, 92, 94, 95, 97], "resum": 94, "resume_path": 94, "resurect": 70, "ret": 86, "retreiv": 70, "retri": 86, "retriev": [8, 9, 90], "retry_if_exception_typ": 86, "retry_st": 86, "retryerror": 86, "return": [2, 3, 4, 6, 8, 9, 10, 11, 12, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 62, 65, 66, 67, 70, 71, 72, 73, 74, 75, 76, 78, 79, 80, 86, 87, 89, 90, 92, 93, 94, 97], "return_info": 70, "return_length": 71, "reusabl": [5, 6, 10], "reveal": [47, 48, 49], "revers": [2, 12, 75, 76], "revisit": [8, 13], "rew": [86, 94, 97], "reward": [2, 3, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 69, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93, 94], "reward_list": [72, 73], "reward_map": 10, "reward_metr": [94, 97], "reward_sum": [87, 89], "rewrit": [40, 70], "rgb": [13, 41, 70], "rgb_arrai": [2, 3, 9, 11, 12, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 65, 66, 67, 70, 71, 72, 73, 76, 89], "rgb_imag": 13, "richard": 71, "right": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 42, 43, 54, 65, 66, 71, 79, 80], "right_paddle_spe": [9, 39], "rightmost": [41, 65], "ring": 15, "riot": 68, "rl": [2, 9, 43, 44, 45, 46, 47, 48, 50, 51, 52, 70, 71, 72, 73, 75, 77, 90, 91, 96], "rl_hp": [71, 72, 73], "rl_hp_select": [71, 72, 73], "rlcard": [42, 45, 48, 50, 51, 70], "rlcard_env": [45, 48, 50, 51], "rllib": [3, 68, 70], "rllib_leduc_holdem": 87, "rllib_num_gpu": [87, 89], "rnd": 70, "robber": 26, "robot": [7, 65], "robust": 70, "rock": [2, 3, 10, 70, 88, 90, 95], "rock_paper_scissor": 86, "rohan": [87, 89], "rohan138": [87, 89], "role": 68, "rollout": [75, 87, 89], "rollout_fragment_length": [87, 89], "rollov": [12, 76], "rom": [13, 70, 75], "rom_path": [13, 75], "rook": 43, "room": [2, 32], "root": [2, 81], "rotat": [40, 65], "round": [48, 50, 51, 70, 90], "round_reward": 90, "row": [8, 27, 40, 43, 45, 46, 71], "row_count": 71, "rp": [42, 49, 70], "rps_v2": [2, 10, 49, 86, 95], "rstrip": 75, "rule": [27, 43, 71, 86], "rummi": [42, 70], "run": [1, 2, 3, 4, 11, 12, 17, 25, 32, 62, 67, 70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "run_nam": 75, "ruzh": 42, "ryan": 54, "sabotag": 30, "safe_load": 71, "samaritan": 68, "same": [3, 8, 11, 18, 29, 39, 40, 41, 43, 44, 45, 46, 47, 49, 52, 65, 66, 67, 70, 71, 74, 81, 86, 90, 93], "sampl": [2, 3, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 71, 72, 73, 75, 76, 86, 90, 92], "sane": 10, "satisfi": 47, "save": [12, 46, 71, 72, 73, 76, 89, 90, 92, 93, 94, 97], "save2memori": [72, 73], "save2memoryvectenv": 71, "save_al": 89, "save_best_fn": [94, 97], "save_cod": 75, "save_dir": 4, "save_ob": 70, "save_observ": 4, "save_path": [71, 72, 73], "savecheckpoint": [71, 72, 73], "say_0": [57, 59, 60, 63], "say_1": [57, 59, 60, 63], "say_2": [57, 59, 60, 63], "say_3": [57, 59, 60, 63], "say_4": [59, 60], "say_5": [59, 60], "say_6": [59, 60], "say_7": [59, 60], "say_8": [59, 60], "say_9": [59, 60], "sb3": [70, 91], "sb3_connect_four_action_mask": 90, "sb3_contrib": 90, "sb3actionmaskwrapp": 90, "scalabl": 68, "scalar": [47, 49], "scale": [8, 41, 54, 65, 67, 88], "scale_actions_v0": 8, "scenario": [7, 38, 68], "scenariorunn": 68, "scene": 54, "scenic": 68, "schema": 86, "scheme": [6, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 70], "scipi": 70, "scissor": [2, 3, 10, 70, 88, 90, 95], "scope": 78, "score": [13, 14, 15, 16, 17, 18, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 33, 35, 37, 45, 47, 71, 72, 73, 90], "scratch": [77, 83], "screen": [13, 20, 30, 32, 39, 40, 41, 55, 56, 57, 58, 59, 60, 61, 62, 63, 67, 70], "screen_height": [43, 45, 46, 48, 49, 50, 51, 52], "screen_scal": 44, "script": [1, 70, 75, 90, 92, 93, 96], "sdl_videodriv": [87, 89], "se": 43, "search": [21, 71, 72], "second": [2, 9, 11, 14, 18, 22, 27, 28, 29, 33, 34, 35, 43, 46, 52, 54, 66, 71, 73, 90, 91, 92, 95], "second_0": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37], "secondari": 3, "section": [20, 43, 44, 45, 46, 47, 48, 50, 51, 52, 66, 70, 71], "secur": [68, 70], "see": [2, 3, 4, 7, 8, 10, 13, 19, 20, 38, 47, 54, 55, 56, 63, 70, 71, 75, 77, 83, 85, 87, 88, 89, 90, 91, 92, 93], "seed": [2, 3, 4, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 69, 70, 75, 76, 78, 79, 80, 90, 92, 93, 94, 97], "seed_test": [11, 70], "seem": 90, "seen": [43, 63], "seer": 47, "select": [2, 4, 9, 10, 12, 18, 34, 41, 66, 70, 71, 72, 73, 76, 85, 86], "self": [2, 10, 12, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 68, 70, 74, 75, 76, 78, 79, 80, 86, 87, 89, 90], "self_in_forest": 63, "self_po": [61, 62, 63], "self_vel": [55, 58, 59, 60, 61, 62, 63], "sens": [8, 67], "sensor": [65, 67], "sensor_rang": 67, "sent": [21, 57], "separ": [9, 11, 71, 81, 90], "seq_len": [87, 89], "sequenc": [2, 13, 40, 44, 45, 85], "sequence_spac": 40, "sequenti": [2, 12, 46, 69, 70, 75, 76, 89], "serial": [47, 70], "serv": [14, 22, 28, 29, 33, 35, 70, 71], "server": [70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "set": [5, 6, 8, 9, 10, 11, 13, 17, 26, 38, 40, 41, 42, 43, 44, 45, 47, 50, 51, 54, 63, 64, 65, 67, 70, 71, 73, 79, 80, 86, 92, 93], "set_ep": [94, 97], "set_postfix_str": 71, "set_random_se": 90, "setup": [12, 70, 78], "seventh": 43, "sever": [40, 54], "sgd_minibatch_s": 89, "shahofblah": 70, "shape": [8, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 71, 72, 73, 75, 76, 87, 94, 97], "share": [8, 30, 66, 88, 91], "shared_reward": [65, 66], "shelf": 91, "shield": 30, "shift": 30, "shimmi": [2, 5, 47, 68, 70], "shimmy2022github": 7, "ship": 30, "shoot": 40, "short": 78, "shorter": 74, "shot": 18, "should": [2, 4, 6, 9, 10, 11, 18, 39, 40, 41, 43, 44, 46, 47, 49, 52, 65, 66, 67, 71, 72, 73, 75, 76, 78, 79, 80, 86, 87, 89, 90, 92, 93, 94, 95, 97], "show": [2, 12, 47, 49, 52, 71, 72, 73, 75, 76, 77, 87, 88, 89, 90, 91, 92, 93, 95, 97], "shown": [6, 51, 66, 71, 72, 73, 74, 75, 76, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "shuffl": [12, 75, 76], "side": [14, 20, 22, 27], "signal": [54, 57, 65, 70], "signifi": 43, "signific": [8, 47, 70, 71], "significantli": [70, 74, 92, 93], "similar": [2, 3, 5, 6, 9, 10, 31, 43, 46, 51, 60, 63, 69], "similarli": [52, 67], "simpl": [2, 3, 5, 6, 8, 9, 10, 39, 41, 47, 52, 54, 69, 73, 74, 77, 86, 88, 91, 95], "simple_adversari": 56, "simple_adversary_v3": [55, 56, 70], "simple_crypto": 57, "simple_crypto_v3": 57, "simple_env": 70, "simple_push": 58, "simple_push_v3": 58, "simple_refer": [59, 60, 70], "simple_reference_v3": 59, "simple_speaker_listen": 60, "simple_speaker_listener_v4": [60, 73], "simple_spread": [61, 70], "simple_spread_v3": 61, "simple_tag": [62, 63], "simple_tag_v3": [54, 62], "simple_v3": 55, "simple_world_comm": 63, "simple_world_comm_v3": 63, "simpleenv": 70, "simpler": [2, 43, 83, 90], "simplest": 4, "simpli": [11, 49, 70, 71, 86], "simplic": 81, "simplifi": [8, 68], "simul": [65, 67, 68, 86], "simultan": [2, 3, 49, 59, 69, 78], "sinc": [8, 9, 25, 49, 54], "singl": [2, 8, 9, 11, 20, 43, 47, 55, 65, 66, 68, 70, 71, 77, 85, 90, 91, 92, 93], "single_act": 87, "single_action_spac": 75, "single_observation_spac": 75, "singular": 70, "sisl": [6, 65, 66, 67, 70, 93], "site": 70, "situat": 7, "six": [48, 70, 85], "size": [8, 40, 46, 47, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 66, 67, 70, 71, 72, 73, 94, 97], "skill": 71, "skip": [8, 13, 86, 90], "skyjo": 68, "slightli": [45, 71], "slope": 71, "slow": 70, "slower": 62, "slowli": [32, 71], "small": [9, 39, 43, 47, 63, 65, 70, 71], "smaller": [71, 90, 94], "smoother": 70, "so": [6, 8, 9, 10, 11, 13, 27, 29, 30, 32, 35, 41, 43, 47, 52, 54, 62, 68, 70, 71, 75, 79, 80, 86, 90, 92, 93], "social": 7, "soft": [71, 72, 73], "softwar": [7, 96], "sole": 42, "solv": [27, 71], "solvabl": 90, "some": [2, 3, 5, 9, 10, 11, 13, 14, 16, 17, 22, 26, 28, 30, 35, 54, 70, 71, 80, 85, 86], "somehow": 30, "someth": [40, 87, 89], "sometim": [13, 51, 54, 71], "songyi": 42, "soon": 40, "sophist": 71, "sort": 8, "sound": 71, "sourc": [2, 3, 4, 6, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 68, 85, 88], "sp": 75, "space": [2, 3, 4, 6, 8, 9, 10, 13, 38, 39, 40, 41, 42, 55, 56, 57, 58, 59, 60, 61, 62, 63, 66, 68, 70, 71, 72, 73, 75, 79, 80, 87, 90, 91, 92, 93, 94, 97], "space_invad": [30, 72], "space_invaders_v2": [8, 13, 30, 72], "space_war": 31, "space_war_v2": 31, "spade": [45, 50, 51], "spawn": [4, 40, 41, 66, 91, 92], "spawn_rat": 40, "speak": 60, "speaker": [54, 59, 73, 74], "speaker_0": 60, "speaker_listen": 73, "special": 9, "specif": [2, 3, 8, 14, 16, 17, 22, 26, 28, 29, 30, 35, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 61, 65, 66, 67, 68, 70, 71, 72, 73, 75, 85], "specifi": [2, 4, 8, 9, 10, 13, 38, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 54, 65, 66, 67, 71, 72, 73, 75, 79, 80], "speed": [16, 39, 65, 67, 92, 93, 96], "speed_featur": 67, "speedup": 70, "sphinx": [1, 70], "split": 56, "spock": [49, 70], "spot": 43, "spread": 54, "springer": 64, "sprite": 13, "sqrt": [12, 75, 76], "squar": [21, 40, 43, 70], "squeez": [72, 73], "ss": [72, 75, 89, 92, 93], "ssd": 68, "stab": 40, "stabil": [71, 72], "stabl": [70, 90, 92, 93], "stable_baselines3": [90, 92, 93], "stack": [5, 8, 12, 43, 46, 76, 91, 92], "stack_siz": [12, 76], "stag": 68, "stage": [2, 18, 20, 71], "stai": [39, 41, 66, 92], "stall": [14, 18, 22, 27, 28, 29, 33, 34, 35, 70], "stand": [36, 44], "standalon": 70, "standard": [2, 3, 4, 8, 11, 13, 46, 47, 49, 51, 69, 70, 85, 96], "stanford": 64, "start": [2, 8, 10, 21, 30, 39, 40, 41, 43, 44, 46, 47, 49, 52, 54, 65, 66, 67, 70, 71, 72, 73, 75, 76, 79, 80, 83, 90, 92, 93], "start_dim": [12, 76], "start_tim": 75, "state": [2, 3, 4, 6, 9, 10, 39, 40, 41, 43, 44, 46, 47, 49, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70, 71, 72, 73, 79, 80, 85, 87, 89, 91], "state_dict": [71, 94, 97], "state_dim": [71, 72, 73], "state_out": 87, "state_shap": [94, 97], "state_spac": [9, 70], "static": [2, 4, 54, 70], "stationari": 71, "std": [12, 75, 76], "steal": 25, "step": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 75, 76, 78, 79, 80, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "step_per_collect": [94, 97], "step_per_epoch": [94, 97], "stick": 8, "sticki": [8, 27], "sticky_act": 13, "sticky_actions_v0": [8, 13], "still": [10, 26, 40, 41, 49, 71], "stochast": [2, 3], "stone": 46, "stop": [4, 71, 72, 73, 86, 87, 89], "stop_after_attempt": 86, "stop_fn": [94, 97], "storag": [12, 75, 76], "store": [2, 9, 10, 47, 71, 78], "store_tru": 94, "str": [2, 3, 4, 10, 11, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 66, 70, 71, 75, 90, 92, 93, 94], "straight": 40, "strategi": [18, 27, 30, 32, 34, 52, 71], "streamlin": [70, 74], "strength": [71, 72, 73], "strftime": [71, 90, 92, 93], "stride": [71, 72, 75, 89], "stride_s": [71, 72], "string": [2, 3, 4, 6, 8, 9, 10, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70], "strip": 90, "strong": 71, "strong_rule_based_oppon": 71, "strongli": 10, "strtobool": 75, "structur": [2, 9, 40, 65, 70, 79, 83, 86], "stubborn": 7, "stuck": [19, 20], "studi": [9, 13, 43], "style": [12, 34, 43, 46, 70, 71, 76], "sub": 91, "subclass": 86, "subprocess": [2, 10, 39, 40, 41, 43, 44, 46, 47, 49, 52, 65, 66, 67], "substanti": 70, "substrat": 7, "substrate_nam": 7, "succe": 22, "success": [15, 18, 54, 71], "successfulli": [1, 27, 44, 70, 71], "suffici": 8, "suggest": 70, "suit": [7, 45, 48, 81], "sum": [4, 14, 18, 22, 24, 25, 27, 28, 29, 33, 34, 35, 47, 54, 61, 71, 72, 73, 86, 90, 92, 93], "sum_of_reward": 86, "summar": 85, "summarywrit": [75, 94], "super": [12, 75, 76, 86, 90], "superior": [70, 73], "supersuit": [5, 10, 12, 13, 70, 71, 72, 73, 75, 76, 87, 88, 89, 91, 92, 93], "support": [2, 3, 4, 6, 8, 9, 10, 11, 13, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 68, 69, 70, 71, 75, 90, 91, 92], "suppress": 4, "suppress_output": 4, "sure": [11, 81], "surprisingli": 8, "surrog": 75, "surround": [13, 41, 46, 66], "surround_v2": 32, "surviv": 67, "sushant1212": 70, "sutton": 71, "svg": 11, "sw": 43, "swap": [52, 71, 72, 73], "swap_channel": [72, 73], "swing": 40, "switch": [2, 9, 23, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70], "sword": 40, "symmetr": 20, "sync_tensorboard": 75, "system": [4, 9, 10, 13, 24, 31, 43, 46, 54, 64, 71], "systemmessag": 86, "t": [8, 9, 10, 12, 30, 33, 47, 56, 62, 70, 75, 76, 90], "tabl": [26, 49, 65, 67], "tac": [70, 94, 97], "tag": [54, 66, 70], "tag_reward": 66, "tai": 7, "take": [2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 18, 27, 34, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70, 71, 72, 73, 79, 80, 85, 86, 90, 91, 92, 93], "taken": [2, 9, 31, 47, 49, 71, 80], "taller": 8, "talli": 27, "talviti": 13, "tamar": 54, "tank": 13, "target": [47, 56, 59, 67, 71, 72, 73, 75, 94], "target_kl": 75, "target_update_freq": [94, 97], "task": [71, 77], "tau": [71, 72, 73], "td": 71, "teach": 71, "team": [7, 18, 22, 29, 35, 54, 57, 75], "team_siz": 7, "teammat": 20, "technic": 70, "techniqu": [71, 74], "teleport": 39, "tell": [8, 10, 11, 47, 86, 91], "temperatur": 86, "temporarili": [54, 70], "tenac": 86, "tenni": 13, "tennis_v3": 33, "tensor": [12, 75, 76, 87], "tensorboard": [70, 75, 76, 77, 94], "tensorboardlogg": 94, "tensorflow": [87, 89], "term": [12, 27, 43, 76, 86], "term_pursuit": 66, "termin": [2, 3, 4, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93], "terminate_on_fal": 65, "terminate_reward": 65, "terminateilleg": 70, "terminateillegalwrapp": [6, 7], "termini": 86, "terrain": 65, "terrain_length": 65, "terri": [7, 8, 13], "territori": 46, "terry2020arcad": 13, "test": [4, 7, 10, 70, 71, 72, 73, 75, 76, 78, 83, 92, 94, 96], "test_action_flex": 70, "test_action_mask_easi": 90, "test_action_mask_hard": 90, "test_action_mask_medium": 90, "test_collector": [94, 97], "test_env": [87, 94, 97], "test_fn": [94, 97], "test_in_train": [94, 97], "test_kept_st": 11, "test_num": 94, "test_save_ob": 11, "texa": [42, 48, 70, 90], "texas_holdem": 50, "texas_holdem_no_limit": [51, 86], "texas_holdem_no_limit_v6": [51, 86, 90], "texas_holdem_v4": [50, 90], "text": [2, 70, 71, 72, 73, 85, 86], "text_color": [71, 72, 73], "th": [43, 94], "than": [8, 46, 49, 51, 70, 71, 80, 90, 92, 93], "thank": 70, "thei": [9, 10, 11, 12, 14, 15, 17, 20, 26, 27, 28, 30, 33, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 57, 61, 62, 65, 66, 67, 70, 71, 76], "them": [6, 9, 11, 24, 25, 27, 30, 34, 41, 42, 54, 56, 65, 70, 71, 85, 92], "theme": 70, "themikeste1": 70, "themselv": 85, "theoret": [13, 68], "theori": [2, 68], "therefor": [49, 67, 71], "thermomet": 47, "thi": [1, 2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "thing": 70, "think": [27, 71, 78, 79], "third": [46, 66, 70], "third_0": [22, 29, 35, 36], "third_party_env": 70, "thorough": 96, "those": [45, 47, 64, 71], "though": [9, 10, 54, 83], "thought": [2, 70], "three": [13, 43, 51, 64, 70, 71], "three_in_row": 71, "three_in_row_count": 71, "threshold": 75, "through": [2, 3, 6, 9, 10, 11, 17, 19, 20, 21, 26, 70, 71, 72, 73, 74, 78, 85], "throw": [47, 70], "thrust": 67, "thrust_penalti": 67, "thu": [9, 41, 58, 94, 95, 97], "ti": 90, "tianshou": 70, "tic": [70, 94, 97], "tic_tac_to": [86, 94], "tictacto": [42, 52, 70], "tictactoe_v3": [6, 52, 86, 90, 94, 97], "tie": [2, 90], "tier": 39, "tiger_d": 70, "tight": 77, "time": [1, 2, 4, 6, 8, 9, 10, 14, 16, 18, 22, 23, 24, 26, 27, 28, 29, 30, 33, 34, 35, 37, 39, 40, 41, 42, 44, 48, 49, 51, 63, 65, 66, 67, 68, 70, 71, 74, 75, 79, 80, 86, 90, 92, 93], "time_penalti": [41, 89], "timelin": 53, "timer": [14, 18, 22, 27, 28, 29, 33, 34, 35, 70], "timestamp": [79, 80], "timestep": [6, 39, 65, 75, 77, 79, 80, 87, 90], "timesteps_tot": [87, 89], "titl": [7, 8, 13, 42, 54, 64], "to_dict": [87, 89], "to_parallel": 70, "tobirohr": 70, "todo": [75, 87, 90], "toe": [70, 94, 97], "togeth": [30, 47, 54, 67], "toggl": [66, 67, 75], "token": [27, 44, 47], "tolist": 71, "toml": 70, "too": 71, "took": [47, 70], "tool": [13, 69, 85], "toolkit": 42, "top": [1, 30, 40, 45, 46, 65, 66, 71, 79], "torch": [12, 71, 72, 73, 75, 76, 87, 89, 94, 97], "torch_determinist": 75, "torch_modelv2": 89, "torch_util": 87, "torchfc": 87, "torchmaskedact": 87, "torchmodelv2": 89, "toreset": 70, "total": [20, 39, 40, 46, 47, 59, 63, 65, 70, 71, 72, 73, 75, 90], "total_episod": [12, 71, 76], "total_episodic_return": [12, 76], "total_reward": 90, "total_step": 71, "total_timestep": [75, 90, 92, 93], "touch": [40, 66, 67], "tournament": [46, 71, 72, 73], "tournament_s": [71, 72, 73], "tournamentselect": [71, 72, 73], "toward": [10, 29, 35, 36, 41, 43, 65], "tower": 7, "tqdm": [71, 72, 73], "track": [16, 47, 71, 75, 77, 78, 90, 91], "tracker": 71, "tradit": [22, 74, 85], "traffic": 68, "trail": 32, "train": [3, 4, 12, 39, 43, 65, 68, 70, 74, 75, 76, 77, 91, 94, 95, 96], "train_action_mask": 90, "train_actions_dict": 71, "train_actions_hist": 71, "train_ag": 94, "train_batch_s": [87, 89], "train_butterfly_supersuit": 93, "train_collector": [94, 97], "train_env": [94, 97], "train_fn": [94, 97], "trainer": [94, 97], "training_num": [94, 97], "trang": [71, 72, 73], "transform": [5, 8, 10, 46], "transient": 70, "transit": [9, 12, 71, 76], "transmit": 54, "transpos": [12, 76], "trap": 27, "travel": 21, "travers": 26, "treat": [8, 9, 71], "tree": 2, "tri": [10, 11], "trigger": 8, "troubleshoot": 70, "true": [4, 8, 9, 13, 16, 17, 30, 39, 40, 41, 45, 47, 54, 65, 66, 67, 70, 71, 72, 73, 75, 79, 80, 86, 89, 90, 92, 93, 94, 97], "truetyp": 71, "trunc": [12, 76, 86], "truncat": [2, 3, 4, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93], "trust": 7, "try": [2, 3, 14, 29, 30, 32, 35, 57, 67, 71, 72, 73, 75, 79, 86, 90, 92, 93], "try_import_torch": 87, "ttf": 71, "ttt": 97, "tunabl": 68, "tune": [77, 87, 89, 90], "tupl": [2, 3, 8, 94, 97], "turn": [2, 4, 6, 8, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 67, 69, 70, 71, 87], "turns_per_episod": 71, "tut": 70, "tutori": [2, 3, 10, 68, 70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "tutorial2_adding_game_log": 81, "tutorial3_action_mask": 81, "tv": 8, "twin": 73, "two": [3, 8, 11, 13, 15, 18, 22, 23, 25, 28, 29, 30, 39, 40, 41, 43, 45, 46, 49, 51, 65, 67, 70, 71, 79, 90, 91, 95], "txt": [1, 78], "type": [2, 3, 6, 8, 10, 11, 40, 43, 47, 70, 71, 75, 85, 87, 90, 94, 96, 97], "type_onli": [8, 75], "typemask": 40, "typevar": 70, "typic": [2, 3, 9, 10, 54, 67], "typo": 70, "t\u014drere": 68, "u": [1, 40, 71], "ui": 68, "uint8": 8, "ultim": 71, "umutucak": 70, "unari": 47, "unbatchifi": [12, 76], "unchang": 39, "uncom": 71, "under": [65, 70], "underli": [2, 6, 9, 70], "underneath": 9, "underpromot": 43, "understand": [10, 71, 72, 73, 75, 76, 78, 79, 86, 87, 89, 90, 92, 93, 94, 95, 97], "undertak": 71, "unexpect": 70, "unfamiliar": 7, "unforgiv": 24, "uniformli": 54, "unintent": 70, "union": 51, "uniqu": [13, 38, 42, 54, 64], "unit": [40, 41, 54, 66, 71], "uniti": 68, "unknown": 45, "unless": [17, 26, 90, 92], "unlik": [33, 43, 71], "unlimit": 71, "unmaintain": 70, "unnecessari": 70, "unpredict": 40, "unscal": 56, "unsuit": 4, "unsuppress_output": 4, "unsur": [2, 3], "until": [4, 10, 13, 44, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 71, 85], "unwrap": [70, 86, 90, 92, 93], "up": [8, 9, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 41, 43, 45, 54, 56, 66, 70, 71, 74, 79, 80, 92, 93], "upcom": 70, "updat": [2, 3, 6, 8, 10, 70, 71, 72, 73, 75, 79, 80, 90, 94], "update_epoch": 75, "update_per_step": [94, 97], "update_top": 71, "upgrad": [45, 48, 50, 51, 70], "upleft": [15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 31, 33, 37], "upper_bound": [8, 72, 75], "upright": [15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 31, 33, 37], "upstream": 70, "urgency_reward": 66, "url": 7, "us": [2, 3, 4, 6, 7, 8, 9, 11, 12, 13, 19, 20, 21, 38, 39, 40, 41, 42, 43, 45, 46, 47, 48, 51, 54, 57, 64, 67, 69, 70, 75, 76, 78, 79, 80, 81, 84, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "usabl": 70, "usag": [4, 11, 70, 96], "use_ga": 89, "use_typemask": 40, "user": [2, 10, 11, 12, 38, 74, 76, 77], "usual": [43, 44, 45, 46, 47, 48, 50, 51, 52, 78], "util": [2, 3, 5, 7, 9, 11, 69, 70, 71, 72, 73, 75, 85, 87, 90, 91, 94, 97], "uuid": 47, "v": [67, 71, 87, 89, 90, 92, 93, 97], "v0": [10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67], "v1": [10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70, 79, 80, 91], "v10": [10, 40], "v2": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67], "v3": [14, 18, 19, 20, 22, 24, 25, 26, 27, 28, 29, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 50, 51, 52, 65, 66, 67], "v4": [29, 34, 39, 40, 41, 43, 45, 46, 47, 48, 50, 51, 65, 66, 67], "v5": [39, 40, 41, 43, 46, 47, 51, 65, 70], "v6": [40, 41, 43, 51, 65, 70], "v7": [40, 65], "v8": [40, 65], "v9": 40, "v_clip": [12, 75, 76], "v_loss": [12, 75, 76], "v_loss_clip": [12, 75, 76], "v_loss_max": [12, 75, 76], "v_loss_unclip": [12, 75, 76], "v_max": 71, "v_min": 71, "vacuou": 9, "valid": [2, 5, 6, 10, 27, 86], "valid_action_instruct": 86, "valid_posit": 71, "valu": [3, 4, 6, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70, 71, 72, 73, 75, 76, 79, 90, 92, 93], "value_fn": 89, "value_funct": [87, 89], "value_loss": 75, "valueerror": [86, 90, 92, 93], "var": [4, 12, 75, 76], "var_i": [12, 75, 76], "vareiti": 10, "vari": [43, 70, 90, 92, 93], "variabl": [2, 4, 10, 40, 70], "variable_env_test": 2, "varianc": [8, 12, 76], "variat": [13, 48, 51], "varieti": [24, 69, 71], "variou": [7, 13, 65, 66, 67, 70], "ve": 64, "vector": [8, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 54, 65, 67, 70, 91, 92, 93, 95], "vector_st": [40, 92], "vectoris": 95, "vectoriz": 40, "vectorreplaybuff": [94, 97], "vehicl": 68, "veloc": [54, 65, 67, 70], "veness": 13, "verbos": [90, 92, 93], "verbose_progress": 11, "veri": [9, 27, 38, 47, 68, 74, 78], "versa": 54, "version": [4, 7, 10, 11, 13, 67, 70, 71, 78, 87, 94, 95, 97], "vertic": [41, 44, 52, 67, 71], "vertical_thrust": 67, "vertical_win": 71, "vf": 75, "vf_coef": [12, 75, 76], "vf_loss_coeff": 89, "via": [3, 8, 9, 10, 13, 38, 42, 54, 64, 65, 68, 70, 78, 97], "vice": 54, "video": [13, 14, 22, 28, 29, 35, 68, 70, 71, 72, 73, 75, 77], "video_check": 34, "video_checkers_v4": 34, "view": [3, 39, 47, 65, 75, 77, 87, 89, 96], "virtual": [71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "visibilty_level": 26, "visibl": [26, 54], "visit": 70, "visual": [11, 38, 41, 70, 91, 92], "visual_observ": 92, "visualis": [71, 72, 73], "vloss": 75, "volleybal": 13, "volleyball_pong": [35, 70], "volleyball_pong_v2": 35, "volleyball_pong_v3": 35, "volum": 13, "vulner": 43, "vwxyzjn": 75, "w": [39, 40, 41, 43, 71, 72, 73], "wa": [2, 4, 8, 10, 12, 13, 20, 41, 47, 64, 68, 70, 76, 80, 86], "wafer": 25, "wai": [2, 8, 13, 25, 62, 71, 80, 85], "wait": [71, 86], "wait_non": 86, "walk": [10, 40, 83], "walker": 65, "walker_0": 65, "walker_1": 65, "walker_2": 65, "walkthrough": 10, "wall": [17, 20, 26, 32, 41, 66, 80], "wandb": [70, 71, 72, 73, 75], "wandb_dict": 71, "wandb_ent": 75, "wandb_project_nam": 75, "wander": 54, "want": [6, 8, 9, 12, 59, 76], "war": 13, "warlord": [13, 37], "warlords_v3": 36, "warm": 71, "warm_up_oppon": 71, "warmup": 71, "warn": [4, 6, 8, 10, 11, 70, 79, 80, 86], "warn_action_out_of_bound": 4, "warn_on_illegal_mov": 4, "warn_step_after_terminated_trunc": 4, "warp": 71, "wasd": 38, "watch": [90, 92, 93, 94], "waterworld": [64, 70, 88, 91], "waterworld_v4": [64, 67, 70, 93], "wave": 24, "wb": 71, "wd": 70, "we": [2, 3, 6, 9, 10, 11, 12, 13, 43, 64, 70, 71, 76, 78, 79, 80, 81, 86, 90, 91, 92, 93], "weak": 71, "weak_rule_based_oppon": 71, "webassembli": 68, "webgl": 68, "websit": [2, 3, 70], "wed": 39, "wei": 42, "weight": [12, 41, 59, 61, 75, 76, 77], "weird": 9, "welcom": [70, 78], "well": [24, 37, 40, 47, 49, 65, 70, 90], "were": [13, 39, 40, 46, 47, 54, 70, 71], "what": [8, 11, 12, 40, 43, 47, 70, 74, 76, 90], "whatev": 90, "when": [4, 6, 8, 9, 10, 11, 12, 13, 16, 17, 20, 23, 24, 26, 27, 30, 31, 33, 36, 37, 39, 40, 44, 47, 54, 63, 65, 66, 67, 70, 71, 73, 74, 76, 90], "whenev": [2, 4, 15, 16, 17, 19, 31], "where": [1, 2, 3, 4, 6, 7, 8, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 78, 79, 86, 91], "wherea": 2, "whether": [16, 40, 43, 44, 45, 46, 47, 48, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 71, 75, 85], "which": [2, 3, 4, 5, 6, 8, 10, 11, 12, 13, 15, 18, 27, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 56, 57, 59, 65, 66, 67, 70, 71, 76, 80, 85, 86, 87, 90, 92, 95], "while": [3, 4, 6, 7, 8, 9, 10, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 46, 49, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 69, 71, 76, 90], "white": [43, 46, 47, 66, 70], "white_0": 46, "who": [45, 70, 71], "whole": 40, "whose": [43, 44, 45, 46, 47, 48, 50, 51, 52, 67], "why": 4, "wide": [10, 40, 68, 69], "width": [12, 40, 71, 76], "willdudlei": [70, 94, 95, 97], "win": [26, 27, 34, 42, 48, 49, 71, 94], "win_rat": [71, 94], "window": [2, 3, 9, 10, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 65, 66, 67, 70], "winnabl": 71, "winner": [43, 45, 46, 48, 49, 50, 51, 52, 90], "winning_act": 71, "winrat": 90, "wise": 13, "wish": [8, 10, 71, 87], "within": [6, 8, 9, 13, 14, 22, 28, 29, 33, 35, 39, 45, 47, 67, 78], "without": [9, 10, 20, 65, 70, 71, 72, 73, 75, 76, 79, 80, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "wizard": 13, "wizard_of_wor": [36, 37], "wizard_of_wor_v3": 37, "won": [9, 10, 33], "wor": 13, "word": 40, "work": [4, 8, 20, 25, 30, 45, 47, 48, 51, 54, 65, 67, 70, 81, 85, 90, 91], "workflow": 70, "world": [24, 40, 54, 66, 71], "worri": 71, "worth": [30, 71], "would": [2, 3, 6, 7, 8, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 78], "wrap": [6, 7, 9, 10, 45, 48, 51, 70, 90, 95], "wrapped_env": 10, "wrapper": [2, 3, 4, 9, 13, 46, 68, 70, 71, 75, 87, 89, 90, 92], "writer": [75, 94], "written": [70, 96], "wrong": 43, "wu": 54, "www": 70, "x": [8, 12, 40, 41, 43, 46, 52, 59, 62, 63, 65, 66, 67, 75, 76, 79, 80, 86], "x11": 40, "x5": 40, "x_size": [8, 66, 72, 75, 89, 92], "xdist": 70, "xia": 42, "xixinzhang": 70, "y": [8, 13, 40, 43, 46, 65, 67, 71, 79, 80, 90, 92, 93], "y_pred": [12, 75, 76], "y_size": [8, 66, 72, 75, 89, 92], "y_true": [12, 75, 76], "yaml": 71, "yank": 70, "ye": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67], "year": [7, 8, 13, 42, 54, 64, 70], "yellow": 47, "yet": [8, 49], "yi": 54, "yield": [9, 90], "you": [1, 2, 3, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 75, 76, 78, 83, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 97], "younik": 70, "your": [2, 3, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 71, 72, 73, 75, 78, 79, 80, 83, 86, 87, 89], "yourself": [19, 20, 26], "yuanpu": 42, "zealand": 68, "zero": [4, 8, 12, 14, 18, 22, 27, 28, 29, 33, 34, 35, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 54, 57, 65, 70, 71, 75, 76, 80, 88, 90], "zero_grad": [12, 75, 76], "zeros_lik": [12, 71, 75, 76], "zha": 42, "zha2019rlcard": 42, "zigzaging_bomb": 30, "zip": [10, 90, 92, 93], "zombi": [2, 4, 19, 20, 38, 70, 91]}, "titles": ["404 - Page Not Found", "PettingZoo docs", "AEC API", "Parallel API", "Utils", "Wrappers", "PettingZoo Wrappers", "Shimmy Compatibility Wrappers", "Supersuit Wrappers", "Basic Usage", "Environment Creation", "Testing Environments", "Tutorials", "Atari", "Basketball Pong", "Boxing", "Combat: Plane", "Combat: Tank", "Double Dunk", "Emtombed: Competitive", "Emtombed: Cooperative", "Flag Capture", "Foozpong", "Ice Hockey", "Joust", "Mario Bros", "Maze Craze", "Othello", "Pong", "Quadrapong", "Space Invaders", "Space War", "Surround", "Tennis", "Video Checkers", "Volleyball Pong", "Warlords", "Wizard of Wor", "Butterfly", "Cooperative Pong", "Knights Archers Zombies (\u2018KAZ\u2019)", "Pistonball", "Classic", "Chess", "Connect Four", "Gin Rummy", "Go", "Hanabi", "Leduc Hold\u2019em", "Rock Paper Scissors", "Texas Hold\u2019em", "Texas Hold\u2019em No Limit", "Tic Tac Toe", "<no title>", "MPE", "Simple", "Simple Adversary", "Simple Crypto", "Simple Push", "Simple Reference", "Simple Speaker Listener", "Simple Spread", "Simple Tag", "Simple World Comm", "SISL", "Multiwalker", "Pursuit", "Waterworld", "Third-Party Environments", "<no title>", "Release Notes", "AgileRL: Implementing DQN - Curriculum Learning and Self-play", "AgileRL: Implementing MADDPG", "AgileRL: Implementing MATD3", "AgileRL Tutorial", "CleanRL: Advanced PPO", "CleanRL: Implementing PPO", "CleanRL Tutorial", "Tutorial: Repository Structure", "Tutorial: Environment Logic", "Tutorial: Action Masking", "Tutorial: Testing Your Environment", "<no title>", "Custom Environment Tutorial", "<no title>", "LangChain Tutorial", "LangChain: Creating LLM agents", "RLlib: DQN for Simple Poker", "Ray RLlib Tutorial", "RLlib: PPO for Pistonball", "SB3: Action Masked PPO for Connect Four", "Stable-Baselines3 Tutorial", "SB3: PPO for Knights-Archers-Zombies", "SB3: PPO for Waterworld", "Tianshou: CLI and Logging", "Tianshou: Basic API Usage", "Tianshou Tutorial", "Tianshou: Training Agents"], "titleterms": {"0": 70, "1": 70, "10": 70, "11": 70, "12": 70, "13": 70, "14": 70, "15": 70, "16": 70, "17": 70, "18": 70, "19": 70, "2": 70, "20": 70, "21": 70, "22": 70, "23": 70, "24": 70, "3": 70, "4": 70, "404": 0, "5": 70, "6": 70, "7": 70, "8": 70, "9": 70, "No": [51, 86], "Not": 0, "The": 0, "With": 9, "about": 2, "action": [2, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 67, 80, 86, 90], "addit": [9, 78], "advanc": [75, 78], "adversari": 56, "aec": [2, 6, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 68], "aecenv": 2, "agent": [4, 7, 8, 9, 10, 68, 71, 72, 73, 85, 86, 87, 89, 97], "agilerl": [71, 72, 73, 74], "ai": 68, "an": [1, 9], "api": [2, 3, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 95], "archer": [40, 92], "architectur": [88, 96], "argument": [39, 40, 41, 45, 46, 47, 49, 50, 51, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67], "atari": 13, "attribut": 2, "augment": 85, "averag": 4, "base": 40, "baselin": 91, "baselines3": 91, "basic": [9, 95], "basketbal": 14, "battl": 68, "battlesnak": 68, "benchmark": 11, "bombermanai": 68, "box": 15, "breakout": 68, "bro": 25, "build": 1, "butterfli": 38, "can": [71, 72, 73], "captur": [4, 21], "carla": 68, "cathedr": 68, "chain": 85, "check": 9, "checker": 34, "chess": 43, "citat": [7, 8, 13, 54], "classic": [42, 90], "cleanrl": [75, 76, 77], "cli": 94, "clone": 68, "code": [71, 72, 73, 75, 76, 78, 79, 80, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "cogment": 68, "combat": [16, 17], "comm": 63, "common": 13, "compat": 7, "competit": 19, "compon": 9, "concept": 54, "config": 71, "conflict_rez": 68, "connect": [44, 68, 71, 90], "control": [7, 39, 40, 66], "convers": 6, "cookingzoo": 68, "cooper": [20, 39], "could": 0, "craze": 26, "crazi": 68, "creat": 86, "creation": 10, "crypto": 57, "curriculum": 71, "custom": [10, 83], "cyber": 68, "cycl": 11, "data": 85, "death": 9, "deepmind": 7, "default": 40, "deprec": 10, "detail": 13, "develop": 10, "dilemma": 68, "doc": 1, "document": 1, "done": 9, "doubl": 18, "dqn": [71, 87], "drone": 68, "dsse": 68, "dunk": 18, "edit": 1, "em": [48, 50, 51], "emtomb": [19, 20], "entir": 9, "env": 68, "environ": [1, 7, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 47, 54, 68, 71, 72, 73, 75, 76, 79, 81, 83, 86, 87, 88, 89, 90, 92, 93, 94, 95, 97], "envlogg": 4, "evalu": [85, 90, 92, 93], "exampl": [2, 3, 10, 74, 77, 88, 96], "expand": 49, "fanorona": 68, "file": [71, 78], "flag": 21, "foozpong": 22, "found": 0, "four": [44, 68, 71, 90], "full": [71, 86], "function": 8, "galaga": 68, "game": [13, 49, 68], "gener": [71, 85], "gin": 45, "go": 46, "gobblet": 68, "ground": 68, "gym": 68, "gymnasium": 86, "hanabi": 47, "hearth": 68, "histori": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66], "hockei": 23, "hold": [48, 50, 51], "holdem": 86, "i": [9, 71, 72, 73], "ic": 23, "idiom": 9, "imag": 40, "implement": [71, 72, 73, 76], "import": 71, "includ": 8, "initi": 9, "instal": [9, 13, 38, 42, 54, 64], "integr": 77, "interact": [9, 68], "introduct": [78, 79, 80, 81], "invad": 30, "joust": 24, "kaggl": 68, "kaz": 40, "kei": 54, "knight": [40, 92], "langchain": [85, 86], "latest": 68, "learn": 71, "leduc": 48, "legal": [43, 44, 45, 46, 47, 48, 50, 51, 52], "limit": [51, 86], "listen": 60, "llm": [85, 86], "log": 94, "logic": 79, "loop": [71, 86], "maddpg": [72, 73], "manual": [39, 40, 66], "mario": 25, "mask": [2, 43, 44, 45, 46, 47, 48, 50, 51, 52, 80, 86, 90], "mat": 68, "matd3": 73, "max": 11, "maze": 26, "melt": 7, "memori": 85, "method": 2, "minim": [14, 21, 22, 27, 28, 29, 30, 32, 34, 35, 36], "mmo": 68, "model": 71, "modul": 10, "mpe": 54, "mu": 68, "multi": [7, 8], "multipl": [72, 73], "multiwalk": 65, "muzero": 68, "neural": 68, "notabl": 9, "note": 70, "number": 9, "observ": [4, 11, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 65, 67], "older": 68, "onli": 8, "openspiel": 7, "oper": 68, "option": [9, 78], "othello": 27, "other": 90, "overview": [13, 74, 77, 85, 88, 91, 96], "page": [0, 1], "paper": [49, 86], "parallel": [3, 6, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67], "parallelenv": 3, "paramet": [13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37], "parti": 68, "perform": 11, "pettingzoo": [1, 6, 68, 70, 74, 77, 86, 88, 90, 96], "pistonbal": [41, 89], "plai": [71, 72, 73, 87, 89], "plane": 16, "pogema": 68, "poker": 87, "pong": [14, 28, 35, 39], "pot": 7, "ppo": [75, 76, 89, 90, 92, 93], "preprocess": 13, "prompt": 85, "pursuit": 66, "push": 58, "pz": 68, "quadrapong": 29, "racecar": 68, "rai": 88, "raw": 9, "recommend": 12, "refer": 59, "releas": 70, "render": [11, 54], "repositori": 78, "request": 0, "research": 68, "reward": [4, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 67], "rl": [68, 87, 89], "rllib": [87, 88, 89], "rock": [49, 86], "rummi": 45, "save": [4, 11], "sb3": [90, 92, 93], "scissor": [49, 86], "search": 68, "seed": 11, "selector": [4, 10], "self": 71, "sequenti": 68, "setup": [71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "shimmi": 7, "simpl": [55, 56, 57, 58, 59, 60, 61, 62, 63, 87], "sisl": 64, "skeleton": 78, "skyjo_rl": 68, "soccer": 7, "social": 68, "space": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 65, 67], "speaker": 60, "spread": 61, "stabl": 91, "start": 12, "stdout": 4, "stone": 68, "structur": 78, "sumo": 68, "supersuit": 8, "support": 7, "surround": 32, "swarm": 68, "tac": [52, 86], "tactic": 68, "tag": 62, "tank": 17, "teamfight": 68, "tenni": 33, "termin": 54, "test": [1, 11, 81, 90], "texa": [50, 51, 86], "third": 68, "tianshou": [94, 95, 96, 97], "tic": [52, 86], "toe": [52, 86], "torer": 68, "total": 4, "train": [71, 72, 73, 87, 88, 89, 90, 92, 93, 97], "tree": 78, "tutori": [12, 74, 77, 78, 79, 80, 81, 83, 85, 88, 91, 96], "type": 54, "unwrap": 9, "us": [5, 10, 68, 71, 72, 73, 74, 77, 88, 96], "usag": [2, 3, 7, 9, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 95], "util": [4, 6, 10], "variabl": 9, "vector": 40, "vers": 68, "version": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 68], "video": 34, "volleybal": 35, "wandb": 77, "war": 31, "warlord": 36, "watch": [71, 72, 73, 87, 89], "waterworld": [67, 93], "weight": 71, "what": [71, 72, 73], "wizard": 37, "wor": 37, "world": 63, "wrapper": [5, 6, 7, 8, 10], "your": 81, "zombi": [40, 92]}}) \ No newline at end of file +Search.setIndex({"alltitles": {"0.18.1: 1.18.1": [[70, "release-0-18-1"]], "1.10.0": [[70, "release-1-10-0"]], "1.11.0": [[70, "release-1-11-0"]], "1.11.1": [[70, "release-1-11-1"]], "1.12.0": [[70, "release-1-12-0"]], "1.13.1": [[70, "release-1-13-1"]], "1.14.0": [[70, "release-1-14-0"]], "1.15.0": [[70, "release-1-15-0"]], "1.16.0": [[70, "release-1-16-0"]], "1.17.0": [[70, "release-1-17-0"]], "1.19.0": [[70, "release-1-19-0"]], "1.19.1": [[70, "release-1-19-1"]], "1.20.0": [[70, "release-1-20-0"]], "1.20.1": [[70, "release-1-20-1"]], "1.21.0": [[70, "release-1-21-0"]], "1.22.0": [[70, "release-1-22-0"]], "1.22.1": [[70, "release-1-22-1"]], "1.22.2": [[70, "release-1-22-2"]], "1.22.3": [[70, "release-1-22-3"]], "1.22.4": [[70, "release-1-22-4"]], "1.4.0": [[70, "release-1-4-0"]], "1.4.2": [[70, "release-1-4-2"]], "1.5.0": [[70, "release-1-5-0"]], "1.5.1": [[70, "release-1-5-1"]], "1.5.2": [[70, "release-1-5-2"]], "1.6.0": [[70, "release-1-6-0"]], "1.6.1": [[70, "release-1-6-1"]], "1.7.0": [[70, "release-1-7-0"]], "1.8.0": [[70, "release-1-8-0"]], "1.8.1": [[70, "release-1-8-1"]], "1.8.2": [[70, "release-1-8-2"]], "1.9.0": [[70, "release-1-9-0"]], "404 - Page Not Found": [[0, "page-not-found"]], "AEC": [[14, "aec"], [15, "aec"], [16, "aec"], [17, "aec"], [18, "aec"], [19, "aec"], [20, "aec"], [21, "aec"], [22, "aec"], [23, "aec"], [24, "aec"], [25, "aec"], [26, "aec"], [27, "aec"], [28, "aec"], [29, "aec"], [30, "aec"], [31, "aec"], [32, "aec"], [33, "aec"], [34, "aec"], [35, "aec"], [36, "aec"], [37, "aec"], [39, "aec"], [40, "aec"], [41, "aec"], [43, "aec"], [44, "aec"], [45, "aec"], [46, "aec"], [47, "aec"], [48, "aec"], [49, "aec"], [50, "aec"], [51, "aec"], [52, "aec"], [55, "aec"], [56, "aec"], [57, "aec"], [58, "aec"], [59, "aec"], [60, "aec"], [61, "aec"], [62, "aec"], [63, "aec"], [65, "aec"], [66, "aec"], [67, "aec"]], "AEC API": [[2, "aec-api"]], "AEC to Parallel": [[6, "module-pettingzoo.utils.conversions"]], "AECEnv": [[2, "aecenv"]], "API": [[14, "api"], [15, "api"], [16, "api"], [17, "api"], [18, "api"], [19, "api"], [20, "api"], [21, "api"], [22, "api"], [23, "api"], [24, "api"], [25, "api"], [26, "api"], [27, "api"], [28, "api"], [29, "api"], [30, "api"], [31, "api"], [32, "api"], [33, "api"], [34, "api"], [35, "api"], [36, "api"], [37, "api"], [39, "api"], [40, "api"], [41, "api"], [43, "api"], [44, "api"], [45, "api"], [46, "api"], [47, "api"], [48, "api"], [49, "api"], [50, "api"], [51, "api"], [52, "api"], [55, "api"], [56, "api"], [57, "api"], [58, "api"], [59, "api"], [60, "api"], [61, "api"], [62, "api"], [63, "api"], [65, "api"], [66, "api"], [67, "api"]], "API Test": [[11, "api-test"]], "About AEC": [[2, "about-aec"]], "Action Masking": [[2, "action-masking"]], "Action Masking Agent": [[86, "action-masking-agent"]], "Action Space": [[15, "action-space"], [16, "action-space"], [17, "action-space"], [18, "action-space"], [19, "action-space"], [20, "action-space"], [23, "action-space"], [24, "action-space"], [25, "action-space"], [26, "action-space"], [31, "action-space"], [33, "action-space"], [37, "action-space"], [43, "action-space"], [44, "action-space"], [45, "action-space"], [46, "action-space"], [47, "action-space"], [48, "action-space"], [49, "action-space"], [50, "action-space"], [51, "action-space"], [52, "action-space"], [54, "action-space"], [67, "action-space"]], "Action Space (Minimal)": [[14, "action-space-minimal"], [21, "action-space-minimal"], [22, "action-space-minimal"], [27, "action-space-minimal"], [28, "action-space-minimal"], [29, "action-space-minimal"], [30, "action-space-minimal"], [32, "action-space-minimal"], [34, "action-space-minimal"], [35, "action-space-minimal"], [36, "action-space-minimal"]], "Additional Environment API": [[9, "additional-environment-api"]], "Advanced: Additional (optional) files": [[78, "advanced-additional-optional-files"]], "Agent Selector": [[4, "agent-selector"]], "Agent selector": [[10, "agent-selector"]], "AgileRL Overview": [[74, "agilerl-overview"]], "AgileRL Tutorial": [[74, "agilerl-tutorial"]], "AgileRL: Implementing DQN - Curriculum Learning and Self-play": [[71, "agilerl-implementing-dqn-curriculum-learning-and-self-play"]], "AgileRL: Implementing MADDPG": [[72, "agilerl-implementing-maddpg"]], "AgileRL: Implementing MATD3": [[73, "agilerl-implementing-matd3"]], "Architecture": [[88, "architecture"], [96, "architecture"]], "Arguments": [[39, "arguments"], [40, "arguments"], [41, "arguments"], [45, "arguments"], [46, "arguments"], [49, "arguments"], [50, "arguments"], [51, "arguments"], [55, "arguments"], [56, "arguments"], [57, "arguments"], [58, "arguments"], [59, "arguments"], [60, "arguments"], [61, "arguments"], [62, "arguments"], [63, "arguments"], [65, "arguments"], [66, "arguments"], [67, "arguments"]], "Atari": [[13, "atari"]], "Attributes": [[2, "attributes"]], "Average Total Reward": [[4, "module-pettingzoo.utils.average_total_reward"]], "Basic Usage": [[9, "basic-usage"]], "Basketball Pong": [[14, "basketball-pong"]], "BomberManAI": [[68, "bombermanai"]], "Boxing": [[15, "boxing"]], "Breakout-Clone": [[68, "breakout-clone"]], "Build the Documentation": [[1, "build-the-documentation"]], "Butterfly": [[38, "butterfly"]], "Can I use it?": [[71, "can-i-use-it"], [72, "can-i-use-it"], [73, "can-i-use-it"]], "Capture Stdout": [[4, "capture-stdout"]], "Carla Gym": [[68, "carla-gym"]], "Cathedral-RL": [[68, "cathedral-rl"]], "Checking if the entire environment is done": [[9, "checking-if-the-entire-environment-is-done"]], "Chess": [[43, "chess"]], "Citation": [[7, "citation"], [8, "citation"], [13, "citation"], [54, "citation"]], "Classic": [[42, "classic"]], "CleanRL Overview": [[77, "cleanrl-overview"]], "CleanRL Tutorial": [[77, "cleanrl-tutorial"]], "CleanRL: Advanced PPO": [[75, "cleanrl-advanced-ppo"]], "CleanRL: Implementing PPO": [[76, "cleanrl-implementing-ppo"]], "Code": [[71, "code"], [72, "code"], [73, "code"], [75, "code"], [76, "code"], [79, "code"], [80, "code"], [81, "code"], [87, "code"], [89, "code"], [90, "code"], [92, "code"], [93, "code"], [94, "code"], [95, "code"], [97, "code"]], "Combat: Plane": [[16, "combat-plane"]], "Combat: Tank": [[17, "combat-tank"]], "Common Parameters": [[13, "common-parameters"]], "Config files": [[71, "config-files"]], "Connect Four": [[44, "connect-four"]], "Conversion wrappers": [[6, "conversion-wrappers"]], "CookingZoo": [[68, "cookingzoo"]], "Cooperative Pong": [[39, "cooperative-pong"]], "Crazy-RL": [[68, "crazy-rl"]], "Curriculum Learning": [[71, "curriculum-learning"]], "Curriculum learning and self-play using DQN on Connect Four": [[71, "curriculum-learning-and-self-play-using-dqn-on-connect-four"]], "Custom Environment Tutorial": [[83, "custom-environment-tutorial"]], "Cyber Operations Research Gym": [[68, "cyber-operations-research-gym"]], "DSSE: Drone Swarm Search Environment": [[68, "dsse-drone-swarm-search-environment"]], "DeepMind Control Soccer": [[7, "deepmind-control-soccer"]], "DeepMind Melting Pot": [[7, "deepmind-melting-pot"]], "Deprecated Module": [[10, "deprecated-module"]], "Developer Utils": [[10, "developer-utils"]], "Double Dunk": [[18, "double-dunk"]], "Editing an environment page": [[1, "editing-an-environment-page"]], "Emtombed: Competitive": [[19, "emtombed-competitive"]], "Emtombed: Cooperative": [[20, "emtombed-cooperative"]], "EnvLogger": [[4, "envlogger"]], "Environment Creation": [[10, "environment-creation"]], "Environment Details": [[13, "environment-details"]], "Environment Loop": [[86, "environment-loop"]], "Environment Setup": [[71, "environment-setup"], [72, "environment-setup"], [73, "environment-setup"], [75, "environment-setup"], [76, "environment-setup"], [86, "environment-setup"], [87, "environment-setup"], [89, "environment-setup"], [90, "environment-setup"], [92, "environment-setup"], [93, "environment-setup"], [94, "environment-setup"], [95, "environment-setup"], [97, "environment-setup"]], "Environment arguments": [[47, "environment-arguments"]], "Environment as an Agent": [[9, "environment-as-an-agent"]], "Environment parameters": [[14, "environment-parameters"], [15, "environment-parameters"], [16, "environment-parameters"], [17, "environment-parameters"], [18, "environment-parameters"], [19, "environment-parameters"], [20, "environment-parameters"], [21, "environment-parameters"], [22, "environment-parameters"], [23, "environment-parameters"], [24, "environment-parameters"], [25, "environment-parameters"], [26, "environment-parameters"], [27, "environment-parameters"], [28, "environment-parameters"], [29, "environment-parameters"], [30, "environment-parameters"], [31, "environment-parameters"], [32, "environment-parameters"], [33, "environment-parameters"], [34, "environment-parameters"], [35, "environment-parameters"], [36, "environment-parameters"], [37, "environment-parameters"]], "Environments using older versions of PettingZoo": [[68, "environments-using-older-versions-of-pettingzoo"]], "Environments using the latest versions of PettingZoo": [[68, "environments-using-the-latest-versions-of-pettingzoo"]], "Environments:": [[88, "environments"]], "Example Custom Environment": [[10, "example-custom-environment"]], "Example Custom Parallel Environment": [[10, "example-custom-parallel-environment"]], "Examples": [[2, "examples"], [3, "examples"]], "Examples using PettingZoo": [[74, "examples-using-pettingzoo"], [96, "examples-using-pettingzoo"]], "Examples using PettingZoo:": [[77, "examples-using-pettingzoo"], [88, "examples-using-pettingzoo"]], "Expanded Game": [[49, "expanded-game"], [49, "id3"]], "Fanorona AEC": [[68, "fanorona-aec"]], "Flag Capture": [[21, "flag-capture"]], "Foozpong": [[22, "foozpong"]], "Full Code": [[86, "full-code"]], "Full training code": [[71, "full-training-code"]], "Galaga AI": [[68, "galaga-ai"]], "Games Overview": [[13, "games-overview"]], "General setup": [[71, "general-setup"]], "Gin Rummy": [[45, "gin-rummy"]], "Go": [[46, "go"]], "Gobblet-RL": [[68, "gobblet-rl"]], "Gymnasium Agent": [[86, "gymnasium-agent"]], "Hanabi": [[47, "hanabi"]], "Ice Hockey": [[23, "ice-hockey"]], "Image-based": [[40, "image-based"]], "Imports": [[71, "imports"]], "Included Functions": [[8, "included-functions"]], "Included Multi-Agent Only Functions": [[8, "included-multi-agent-only-functions"]], "Initializing Environments": [[9, "initializing-environments"]], "Installation": [[9, "installation"], [13, "installation"], [38, "installation"], [42, "installation"], [54, "installation"], [64, "installation"]], "Interacting With Environments": [[9, "interacting-with-environments"]], "Interactive Connect Four": [[68, "interactive-connect-four"]], "Introduction": [[78, "introduction"], [79, "introduction"], [80, "introduction"], [81, "introduction"]], "Joust": [[24, "joust"]], "Kaggle Environments": [[68, "kaggle-environments"]], "Key Concepts": [[54, "key-concepts"]], "Knights Archers Zombies (\u2018KAZ\u2019)": [[40, "knights-archers-zombies-kaz"]], "LangChain Overview": [[85, "langchain-overview"]], "LangChain Tutorial": [[85, "langchain-tutorial"]], "LangChain: Creating LLM agents": [[86, "langchain-creating-llm-agents"]], "Leduc Hold\u2019em": [[48, "leduc-hold-em"]], "Legal Actions Mask": [[43, "legal-actions-mask"], [44, "legal-actions-mask"], [45, "legal-actions-mask"], [46, "legal-actions-mask"], [47, "legal-actions-mask"], [48, "legal-actions-mask"], [50, "legal-actions-mask"], [51, "legal-actions-mask"], [52, "legal-actions-mask"]], "MATS Gym": [[68, "mats-gym"]], "MPE": [[54, "mpe"]], "Manual Control": [[39, "manual-control"], [40, "manual-control"], [66, "manual-control"]], "Mario Bros": [[25, "mario-bros"]], "Max Cycles Test": [[11, "max-cycles-test"]], "Maze Craze": [[26, "maze-craze"]], "Methods": [[2, "methods"]], "Mu Torere": [[68, "mu-torere"]], "Multi-Agent Compatibility Wrappers:": [[7, "multi-agent-compatibility-wrappers"]], "Multiwalker": [[65, "multiwalker"]], "Neural MMO": [[68, "neural-mmo"]], "Notable Idioms": [[9, "notable-idioms"]], "Observation Saving": [[4, "module-pettingzoo.utils.save_observation"]], "Observation Space": [[43, "observation-space"], [44, "observation-space"], [45, "observation-space"], [46, "observation-space"], [47, "observation-space"], [48, "observation-space"], [49, "observation-space"], [50, "observation-space"], [51, "observation-space"], [52, "observation-space"], [54, "observation-space"], [65, "observation-space"], [67, "observation-space"]], "OpenSpiel": [[7, "openspiel"]], "Optional API Components": [[9, "optional-api-components"]], "Othello": [[27, "othello"]], "POGEMA": [[68, "pogema"]], "Parallel": [[14, "parallel"], [15, "parallel"], [16, "parallel"], [17, "parallel"], [18, "parallel"], [19, "parallel"], [20, "parallel"], [21, "parallel"], [22, "parallel"], [23, "parallel"], [24, "parallel"], [25, "parallel"], [26, "parallel"], [27, "parallel"], [28, "parallel"], [29, "parallel"], [30, "parallel"], [31, "parallel"], [32, "parallel"], [33, "parallel"], [34, "parallel"], [35, "parallel"], [36, "parallel"], [37, "parallel"], [39, "parallel"], [40, "parallel"], [41, "parallel"], [49, "parallel"], [55, "parallel"], [56, "parallel"], [57, "parallel"], [58, "parallel"], [59, "parallel"], [60, "parallel"], [61, "parallel"], [62, "parallel"], [63, "parallel"], [65, "parallel"], [66, "parallel"], [67, "parallel"]], "Parallel API": [[3, "parallel-api"]], "Parallel API Test": [[11, "parallel-api-test"]], "Parallel to AEC": [[6, "module-pettingzoo.utils.conversions"]], "ParallelEnv": [[3, "parallelenv"]], "Performance Benchmark Test": [[11, "performance-benchmark-test"]], "PettingZoo 1.23.0": [[70, "release-1-23-0"]], "PettingZoo 1.23.1": [[70, "release-1-23-1"]], "PettingZoo 1.24.0": [[70, "release-1-24-0"]], "PettingZoo 1.24.1": [[70, "release-1-24-1"]], "PettingZoo 1.24.2": [[70, "release-1-24-2"]], "PettingZoo 1.24.3": [[70, "release-1-24-3"]], "PettingZoo Agent": [[86, "pettingzoo-agent"]], "PettingZoo Dilemma Envs": [[68, "pettingzoo-dilemma-envs"]], "PettingZoo Wrappers": [[6, "pettingzoo-wrappers"]], "PettingZoo docs": [[1, "pettingzoo-docs"]], "Pistonball": [[41, "pistonball"]], "Pong": [[28, "pong"]], "Preprocessing": [[13, "preprocessing"]], "Pursuit": [[66, "pursuit"]], "Quadrapong": [[29, "quadrapong"]], "RLlib Overview": [[88, "rllib-overview"]], "RLlib: DQN for Simple Poker": [[87, "rllib-dqn-for-simple-poker"]], "RLlib: PPO for Pistonball": [[89, "rllib-ppo-for-pistonball"]], "Racecar Gym": [[68, "racecar-gym"]], "Raw Environments": [[9, "raw-environments"]], "Ray RLlib Tutorial": [[88, "ray-rllib-tutorial"]], "Recommended start": [[12, "recommended-start"]], "Release Notes": [[70, "release-notes"]], "Render Test": [[11, "render-test"]], "Rendering": [[54, "rendering"]], "Rewards": [[43, "rewards"], [44, "rewards"], [45, "rewards"], [46, "rewards"], [47, "rewards"], [48, "rewards"], [49, "rewards"], [50, "rewards"], [51, "rewards"], [52, "rewards"], [67, "rewards"]], "Rock Paper Scissors": [[49, "rock-paper-scissors"]], "Rock, Paper, Scissors": [[49, "id1"], [49, "id2"]], "Rock-Paper-Scissors": [[86, "rock-paper-scissors"]], "SB3: Action Masked PPO for Connect Four": [[90, "sb3-action-masked-ppo-for-connect-four"]], "SB3: PPO for Knights-Archers-Zombies": [[92, "sb3-ppo-for-knights-archers-zombies"]], "SB3: PPO for Waterworld": [[93, "sb3-ppo-for-waterworld"]], "SISL": [[64, "sisl"]], "SMAC and SMACv2 with latest PettingZoo APIs": [[68, "smac-and-smacv2-with-latest-pettingzoo-apis"]], "Save Observation Test": [[11, "save-observation-test"]], "Seed Test": [[11, "seed-test"]], "Self-play": [[71, "self-play"]], "Sequential Social Dilemma Games": [[68, "sequential-social-dilemma-games"]], "Shimmy Compatibility Wrappers": [[7, "shimmy-compatibility-wrappers"]], "Simple": [[55, "simple"]], "Simple Adversary": [[56, "simple-adversary"]], "Simple Crypto": [[57, "simple-crypto"]], "Simple Push": [[58, "simple-push"]], "Simple Reference": [[59, "simple-reference"]], "Simple Speaker Listener": [[60, "simple-speaker-listener"]], "Simple Spread": [[61, "simple-spread"]], "Simple Tag": [[62, "simple-tag"]], "Simple World Comm": [[63, "simple-world-comm"]], "Skeleton code": [[78, "skeleton-code"]], "Space Invaders": [[30, "space-invaders"]], "Space War": [[31, "space-war"]], "Stable-Baselines Overview": [[91, "stable-baselines-overview"]], "Stable-Baselines3 Tutorial": [[91, "stable-baselines3-tutorial"]], "Stone Ground Hearth Battles": [[68, "stone-ground-hearth-battles"]], "Sumo-RL": [[68, "sumo-rl"]], "Supersuit Wrappers": [[8, "supersuit-wrappers"]], "Supported multi-agent environments:": [[7, "supported-multi-agent-environments"]], "Surround": [[32, "surround"]], "Teamfight Tactics MuZero Agent": [[68, "teamfight-tactics-muzero-agent"]], "Tennis": [[33, "tennis"]], "Termination": [[54, "termination"]], "Test the documentation": [[1, "test-the-documentation"]], "Testing Environments": [[11, "testing-environments"]], "Testing other PettingZoo Classic environments": [[90, "testing-other-pettingzoo-classic-environments"]], "Texas Holdem\u2019 No Limit": [[86, "texas-holdem-no-limit"]], "Texas Hold\u2019em": [[50, "texas-hold-em"]], "Texas Hold\u2019em No Limit": [[51, "texas-hold-em-no-limit"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Third-Party Environments": [[68, "third-party-environments"]], "Tianshou Overview": [[96, "tianshou-overview"]], "Tianshou Tutorial": [[96, "tianshou-tutorial"]], "Tianshou: Basic API Usage": [[95, "tianshou-basic-api-usage"]], "Tianshou: CLI and Logging": [[94, "tianshou-cli-and-logging"]], "Tianshou: Training Agents": [[97, "tianshou-training-agents"]], "Tic Tac Toe": [[52, "tic-tac-toe"]], "Tic-Tac-Toe": [[86, "tic-tac-toe"]], "Train multiple agents using MADDPG": [[72, "train-multiple-agents-using-maddpg"], [73, "train-multiple-agents-using-maddpg"]], "Trained model weights": [[71, "trained-model-weights"]], "Training and Evaluation": [[90, "training-and-evaluation"], [92, "training-and-evaluation"], [93, "training-and-evaluation"]], "Training loop": [[71, "training-loop"]], "Training the RL agent": [[87, "training-the-rl-agent"], [89, "training-the-rl-agent"]], "Training:": [[88, "training"]], "Tree structure": [[78, "tree-structure"]], "Tutorial: Action Masking": [[80, "tutorial-action-masking"]], "Tutorial: Environment Logic": [[79, "tutorial-environment-logic"]], "Tutorial: Repository Structure": [[78, "tutorial-repository-structure"]], "Tutorial: Testing Your Environment": [[81, "tutorial-testing-your-environment"]], "Tutorials": [[12, "tutorials"]], "Types of Environments": [[54, "types-of-environments"]], "Unwrapping an environment": [[9, "unwrapping-an-environment"]], "Usage": [[2, "usage"], [3, "usage"], [7, "usage"], [13, "usage"], [14, "usage"], [15, "usage"], [16, "usage"], [17, "usage"], [18, "usage"], [19, "usage"], [20, "usage"], [21, "usage"], [22, "usage"], [23, "usage"], [24, "usage"], [25, "usage"], [26, "usage"], [27, "usage"], [28, "usage"], [29, "usage"], [30, "usage"], [31, "usage"], [32, "usage"], [33, "usage"], [34, "usage"], [35, "usage"], [36, "usage"], [37, "usage"], [38, "usage"], [39, "usage"], [40, "usage"], [41, "usage"], [42, "usage"], [43, "usage"], [44, "usage"], [45, "usage"], [46, "usage"], [47, "usage"], [48, "usage"], [49, "usage"], [50, "usage"], [51, "usage"], [52, "usage"], [54, "usage"], [55, "usage"], [56, "usage"], [57, "usage"], [58, "usage"], [59, "usage"], [60, "usage"], [61, "usage"], [62, "usage"], [63, "usage"], [64, "usage"], [65, "usage"], [66, "usage"], [67, "usage"]], "Using Wrappers": [[5, "using-wrappers"], [10, "using-wrappers"]], "Utility Wrappers": [[6, "utility-wrappers"]], "Utils": [[4, "utils"]], "Variable Numbers of Agents (Death)": [[9, "variable-numbers-of-agents-death"]], "Vectorized (Default)": [[40, "vectorized-default"]], "Version History": [[14, "version-history"], [15, "version-history"], [16, "version-history"], [17, "version-history"], [18, "version-history"], [19, "version-history"], [20, "version-history"], [21, "version-history"], [22, "version-history"], [23, "version-history"], [24, "version-history"], [25, "version-history"], [26, "version-history"], [27, "version-history"], [28, "version-history"], [29, "version-history"], [30, "version-history"], [31, "version-history"], [32, "version-history"], [33, "version-history"], [34, "version-history"], [35, "version-history"], [36, "version-history"], [37, "version-history"], [39, "version-history"], [40, "version-history"], [41, "version-history"], [43, "version-history"], [44, "version-history"], [45, "version-history"], [46, "version-history"], [47, "version-history"], [48, "version-history"], [49, "version-history"], [50, "version-history"], [51, "version-history"], [52, "version-history"], [65, "version-history"], [66, "version-history"]], "Video Checkers": [[34, "video-checkers"]], "Volleyball Pong": [[35, "volleyball-pong"]], "WandB Integration": [[77, "wandb-integration"]], "Warlords": [[36, "warlords"]], "Watch the trained agents play": [[71, "watch-the-trained-agents-play"], [72, "watch-the-trained-agents-play"], [73, "watch-the-trained-agents-play"]], "Watching the trained RL agent play": [[87, "watching-the-trained-rl-agent-play"], [89, "watching-the-trained-rl-agent-play"]], "Waterworld": [[67, "waterworld"]], "What is DQN?": [[71, "what-is-dqn"]], "What is MADDPG?": [[72, "what-is-maddpg"]], "What is MATD3?": [[73, "what-is-matd3"]], "Wizard of Wor": [[37, "wizard-of-wor"]], "Wrappers": [[5, "wrappers"]], "cogment-verse": [[68, "cogment-verse"]], "conflict_rez": [[68, "conflict-rez"]], "gfootball-gymnasium-pettingzoo": [[68, "gfootball-gymnasium-pettingzoo"]], "pz-battlesnake": [[68, "pz-battlesnake"]], "skyjo_rl": [[68, "skyjo-rl"]], "\ud83d\udcc3 LLMs and Prompts:": [[85, "llms-and-prompts"]], "\ud83d\udcda Data Augmented Generation:": [[85, "data-augmented-generation"]], "\ud83d\udd17 Chains:": [[85, "chains"]], "\ud83e\udd16 Agents:": [[85, "agents"]], "\ud83e\uddd0 Evaluation:": [[85, "evaluation"]], "\ud83e\udde0 Memory:": [[85, "memory"]]}, "docnames": ["404", "README", "api/aec", "api/parallel", "api/utils", "api/wrappers", "api/wrappers/pz_wrappers", "api/wrappers/shimmy_wrappers", "api/wrappers/supersuit_wrappers", "content/basic_usage", "content/environment_creation", "content/environment_tests", "content/tutorials", "environments/atari", "environments/atari/basketball_pong", "environments/atari/boxing", "environments/atari/combat_plane", "environments/atari/combat_tank", "environments/atari/double_dunk", "environments/atari/entombed_competitive", "environments/atari/entombed_cooperative", "environments/atari/flag_capture", "environments/atari/foozpong", "environments/atari/ice_hockey", "environments/atari/joust", "environments/atari/mario_bros", "environments/atari/maze_craze", "environments/atari/othello", "environments/atari/pong", "environments/atari/quadrapong", "environments/atari/space_invaders", "environments/atari/space_war", "environments/atari/surround", "environments/atari/tennis", "environments/atari/video_checkers", "environments/atari/volleyball_pong", "environments/atari/warlords", "environments/atari/wizard_of_wor", "environments/butterfly", "environments/butterfly/cooperative_pong", "environments/butterfly/knights_archers_zombies", "environments/butterfly/pistonball", "environments/classic", "environments/classic/chess", "environments/classic/connect_four", "environments/classic/gin_rummy", "environments/classic/go", "environments/classic/hanabi", "environments/classic/leduc_holdem", "environments/classic/rps", "environments/classic/texas_holdem", "environments/classic/texas_holdem_no_limit", "environments/classic/tictactoe", "environments/envs", "environments/mpe", "environments/mpe/simple", "environments/mpe/simple_adversary", "environments/mpe/simple_crypto", "environments/mpe/simple_push", "environments/mpe/simple_reference", "environments/mpe/simple_speaker_listener", "environments/mpe/simple_spread", "environments/mpe/simple_tag", "environments/mpe/simple_world_comm", "environments/sisl", "environments/sisl/multiwalker", "environments/sisl/pursuit", "environments/sisl/waterworld", "environments/third_party_envs", "index", "release_notes/index", "tutorials/agilerl/DQN", "tutorials/agilerl/MADDPG", "tutorials/agilerl/MATD3", "tutorials/agilerl/index", "tutorials/cleanrl/advanced_PPO", "tutorials/cleanrl/implementing_PPO", "tutorials/cleanrl/index", "tutorials/custom_environment/1-project-structure", "tutorials/custom_environment/2-environment-logic", "tutorials/custom_environment/3-action-masking", "tutorials/custom_environment/4-testing-your-environment", "tutorials/custom_environment/5-using-your-environment", "tutorials/custom_environment/index", "tutorials/index", "tutorials/langchain/index", "tutorials/langchain/langchain", "tutorials/rllib/holdem", "tutorials/rllib/index", "tutorials/rllib/pistonball", "tutorials/sb3/connect_four", "tutorials/sb3/index", "tutorials/sb3/kaz", "tutorials/sb3/waterworld", "tutorials/tianshou/advanced", "tutorials/tianshou/beginner", "tutorials/tianshou/index", "tutorials/tianshou/intermediate"], "envversion": {"sphinx": 61, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.intersphinx": 1, "sphinx.ext.viewcode": 1}, "filenames": ["404.md", "README.md", "api/aec.md", "api/parallel.md", "api/utils.md", "api/wrappers.md", "api/wrappers/pz_wrappers.md", "api/wrappers/shimmy_wrappers.md", "api/wrappers/supersuit_wrappers.md", "content/basic_usage.md", "content/environment_creation.md", "content/environment_tests.md", "content/tutorials.md", "environments/atari.md", "environments/atari/basketball_pong.md", "environments/atari/boxing.md", "environments/atari/combat_plane.md", "environments/atari/combat_tank.md", "environments/atari/double_dunk.md", "environments/atari/entombed_competitive.md", "environments/atari/entombed_cooperative.md", "environments/atari/flag_capture.md", "environments/atari/foozpong.md", "environments/atari/ice_hockey.md", "environments/atari/joust.md", "environments/atari/mario_bros.md", "environments/atari/maze_craze.md", "environments/atari/othello.md", "environments/atari/pong.md", "environments/atari/quadrapong.md", "environments/atari/space_invaders.md", "environments/atari/space_war.md", "environments/atari/surround.md", "environments/atari/tennis.md", "environments/atari/video_checkers.md", "environments/atari/volleyball_pong.md", "environments/atari/warlords.md", "environments/atari/wizard_of_wor.md", "environments/butterfly.md", "environments/butterfly/cooperative_pong.md", "environments/butterfly/knights_archers_zombies.md", "environments/butterfly/pistonball.md", "environments/classic.md", "environments/classic/chess.md", "environments/classic/connect_four.md", "environments/classic/gin_rummy.md", "environments/classic/go.md", "environments/classic/hanabi.md", "environments/classic/leduc_holdem.md", "environments/classic/rps.md", "environments/classic/texas_holdem.md", "environments/classic/texas_holdem_no_limit.md", "environments/classic/tictactoe.md", "environments/envs.md", "environments/mpe.md", "environments/mpe/simple.md", "environments/mpe/simple_adversary.md", "environments/mpe/simple_crypto.md", "environments/mpe/simple_push.md", "environments/mpe/simple_reference.md", "environments/mpe/simple_speaker_listener.md", "environments/mpe/simple_spread.md", "environments/mpe/simple_tag.md", "environments/mpe/simple_world_comm.md", "environments/sisl.md", "environments/sisl/multiwalker.md", "environments/sisl/pursuit.md", "environments/sisl/waterworld.md", "environments/third_party_envs.md", "index.md", "release_notes/index.md", "tutorials/agilerl/DQN.md", "tutorials/agilerl/MADDPG.md", "tutorials/agilerl/MATD3.md", "tutorials/agilerl/index.md", "tutorials/cleanrl/advanced_PPO.md", "tutorials/cleanrl/implementing_PPO.md", "tutorials/cleanrl/index.md", "tutorials/custom_environment/1-project-structure.md", "tutorials/custom_environment/2-environment-logic.md", "tutorials/custom_environment/3-action-masking.md", "tutorials/custom_environment/4-testing-your-environment.md", "tutorials/custom_environment/5-using-your-environment.md", "tutorials/custom_environment/index.md", "tutorials/index.md", "tutorials/langchain/index.md", "tutorials/langchain/langchain.md", "tutorials/rllib/holdem.md", "tutorials/rllib/index.md", "tutorials/rllib/pistonball.md", "tutorials/sb3/connect_four.md", "tutorials/sb3/index.md", "tutorials/sb3/kaz.md", "tutorials/sb3/waterworld.md", "tutorials/tianshou/advanced.md", "tutorials/tianshou/beginner.md", "tutorials/tianshou/index.md", "tutorials/tianshou/intermediate.md"], "indexentries": {"action_space() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.action_space", false]], "action_space() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.action_space", false]], "action_space() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.action_space", false]], "action_space() (pettingzoo.classic.chess.chess.raw_env method)": [[43, "pettingzoo.classic.chess.chess.raw_env.action_space", false]], "action_space() (pettingzoo.classic.connect_four.connect_four.raw_env method)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env.action_space", false]], "action_space() (pettingzoo.classic.go.go.raw_env method)": [[46, "pettingzoo.classic.go.go.raw_env.action_space", false]], "action_space() (pettingzoo.classic.hanabi.hanabi.raw_env method)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env.action_space", false]], "action_space() (pettingzoo.classic.rps.rps.raw_env method)": [[49, "pettingzoo.classic.rps.rps.raw_env.action_space", false]], "action_space() (pettingzoo.classic.tictactoe.tictactoe.raw_env method)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env.action_space", false]], "action_space() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.action_space", false]], "action_space() (pettingzoo.sisl.pursuit.pursuit.raw_env method)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env.action_space", false]], "action_space() (pettingzoo.sisl.waterworld.waterworld.raw_env method)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env.action_space", false]], "action_space() (pettingzoo.utils.env.parallelenv method)": [[3, "pettingzoo.utils.env.ParallelEnv.action_space", false]], "action_spaces (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.action_spaces", false]], "action_spaces (pettingzoo.utils.env.parallelenv attribute)": [[3, "pettingzoo.utils.env.ParallelEnv.action_spaces", false]], "aec_to_parallel() (in module pettingzoo.utils.conversions)": [[6, "pettingzoo.utils.conversions.aec_to_parallel", false]], "aecenv (class in pettingzoo.utils.env)": [[2, "pettingzoo.utils.env.AECEnv", false]], "agent_indicator_v0()": [[8, "agent_indicator_v0", false]], "agent_selection (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.agent_selection", false]], "agent_selector (class in pettingzoo.utils.agent_selector)": [[4, "pettingzoo.utils.agent_selector.agent_selector", false]], "agents (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.agents", false]], "agents (pettingzoo.utils.env.parallelenv attribute)": [[3, "pettingzoo.utils.env.ParallelEnv.agents", false]], "agentselector (class in pettingzoo.utils.agent_selector)": [[4, "pettingzoo.utils.agent_selector.AgentSelector", false]], "assertoutofboundswrapper (class in pettingzoo.utils.wrappers)": [[6, "pettingzoo.utils.wrappers.AssertOutOfBoundsWrapper", false]], "average_total_reward() (in module pettingzoo.utils.average_total_reward)": [[4, "pettingzoo.utils.average_total_reward.average_total_reward", false]], "basewrapper (class in pettingzoo.utils.wrappers)": [[6, "pettingzoo.utils.wrappers.BaseWrapper", false]], "black_death_v2()": [[8, "black_death_v2", false]], "built-in function": [[8, "agent_indicator_v0", false], [8, "black_death_v2", false], [8, "clip_actions_v0", false], [8, "clip_reward_v0", false], [8, "color_reduction_v0", false], [8, "delay_observations_v0", false], [8, "dtype_v0", false], [8, "flatten_v0", false], [8, "frame_skip_v0", false], [8, "frame_stack_v1", false], [8, "max_observation_v0", false], [8, "nan_noop_v0", false], [8, "nan_random_v0", false], [8, "nan_zeros_v0", false], [8, "normalize_obs_v0", false], [8, "pad_action_space_v0", false], [8, "pad_observations_v0", false], [8, "reshape_v0", false], [8, "resize_v1", false], [8, "scale_actions_v0", false], [8, "sticky_actions_v0", false]], "capture_stdout (class in pettingzoo.utils.capture_stdout)": [[4, "pettingzoo.utils.capture_stdout.capture_stdout", false]], "capturestdoutwrapper (class in pettingzoo.utils.wrappers)": [[6, "pettingzoo.utils.wrappers.CaptureStdoutWrapper", false]], "clip_actions_v0()": [[8, "clip_actions_v0", false]], "clip_reward_v0()": [[8, "clip_reward_v0", false]], "clipoutofboundswrapper (class in pettingzoo.utils.wrappers)": [[6, "pettingzoo.utils.wrappers.ClipOutOfBoundsWrapper", false]], "close() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.close", false]], "close() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.close", false]], "close() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.close", false]], "close() (pettingzoo.classic.chess.chess.raw_env method)": [[43, "pettingzoo.classic.chess.chess.raw_env.close", false]], "close() (pettingzoo.classic.connect_four.connect_four.raw_env method)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env.close", false]], "close() (pettingzoo.classic.go.go.raw_env method)": [[46, "pettingzoo.classic.go.go.raw_env.close", false]], "close() (pettingzoo.classic.hanabi.hanabi.raw_env method)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env.close", false]], "close() (pettingzoo.classic.rps.rps.raw_env method)": [[49, "pettingzoo.classic.rps.rps.raw_env.close", false]], "close() (pettingzoo.classic.tictactoe.tictactoe.raw_env method)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env.close", false]], "close() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.close", false]], "close() (pettingzoo.sisl.pursuit.pursuit.raw_env method)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env.close", false]], "close() (pettingzoo.sisl.waterworld.waterworld.raw_env method)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env.close", false]], "close() (pettingzoo.utils.env.aecenv method)": [[2, "pettingzoo.utils.env.AECEnv.close", false]], "close() (pettingzoo.utils.env.parallelenv method)": [[3, "pettingzoo.utils.env.ParallelEnv.close", false]], "color_reduction_v0()": [[8, "color_reduction_v0", false]], "delay_observations_v0()": [[8, "delay_observations_v0", false]], "dtype_v0()": [[8, "dtype_v0", false]], "env (class in pettingzoo.butterfly.cooperative_pong.cooperative_pong)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.env", false]], "env (class in pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.env", false]], "env (class in pettingzoo.butterfly.pistonball.pistonball)": [[41, "pettingzoo.butterfly.pistonball.pistonball.env", false]], "env (class in pettingzoo.classic.chess.chess)": [[43, "pettingzoo.classic.chess.chess.env", false]], "env (class in pettingzoo.classic.connect_four.connect_four)": [[44, "pettingzoo.classic.connect_four.connect_four.env", false]], "env (class in pettingzoo.classic.go.go)": [[46, "pettingzoo.classic.go.go.env", false]], "env (class in pettingzoo.classic.hanabi.hanabi)": [[47, "pettingzoo.classic.hanabi.hanabi.env", false]], "env (class in pettingzoo.classic.rlcard_envs.gin_rummy)": [[45, "pettingzoo.classic.rlcard_envs.gin_rummy.env", false]], "env (class in pettingzoo.classic.rlcard_envs.leduc_holdem)": [[48, "pettingzoo.classic.rlcard_envs.leduc_holdem.env", false]], "env (class in pettingzoo.classic.rlcard_envs.texas_holdem)": [[50, "pettingzoo.classic.rlcard_envs.texas_holdem.env", false]], "env (class in pettingzoo.classic.rlcard_envs.texas_holdem_no_limit)": [[51, "pettingzoo.classic.rlcard_envs.texas_holdem_no_limit.env", false]], "env (class in pettingzoo.classic.rps.rps)": [[49, "pettingzoo.classic.rps.rps.env", false]], "env (class in pettingzoo.classic.tictactoe.tictactoe)": [[52, "pettingzoo.classic.tictactoe.tictactoe.env", false]], "env (class in pettingzoo.sisl.multiwalker.multiwalker)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.env", false]], "env (class in pettingzoo.sisl.pursuit.pursuit)": [[66, "pettingzoo.sisl.pursuit.pursuit.env", false]], "env (class in pettingzoo.sisl.waterworld.waterworld)": [[67, "pettingzoo.sisl.waterworld.waterworld.env", false]], "envlogger (class in pettingzoo.utils.env_logger)": [[4, "pettingzoo.utils.env_logger.EnvLogger", false]], "error_agent_iter_before_reset() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.error_agent_iter_before_reset", false]], "error_nan_action() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.error_nan_action", false]], "error_observe_before_reset() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.error_observe_before_reset", false]], "error_possible_agents_attribute_missing() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.error_possible_agents_attribute_missing", false]], "error_render_before_reset() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.error_render_before_reset", false]], "error_state_before_reset() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.error_state_before_reset", false]], "error_step_before_reset() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.error_step_before_reset", false]], "flatten_v0()": [[8, "flatten_v0", false]], "flush() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.flush", false]], "frame_skip_v0()": [[8, "frame_skip_v0", false]], "frame_stack_v1()": [[8, "frame_stack_v1", false]], "get_logger() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.get_logger", false]], "infos (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.infos", false]], "is_first() (pettingzoo.utils.agent_selector.agentselector method)": [[4, "pettingzoo.utils.agent_selector.AgentSelector.is_first", false]], "is_last() (pettingzoo.utils.agent_selector.agentselector method)": [[4, "pettingzoo.utils.agent_selector.AgentSelector.is_last", false]], "max_num_agents (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.max_num_agents", false]], "max_num_agents (pettingzoo.utils.env.parallelenv attribute)": [[3, "pettingzoo.utils.env.ParallelEnv.max_num_agents", false]], "max_observation_v0()": [[8, "max_observation_v0", false]], "module": [[4, "module-pettingzoo.utils.agent_selector", false], [4, "module-pettingzoo.utils.average_total_reward", false], [4, "module-pettingzoo.utils.capture_stdout", false], [4, "module-pettingzoo.utils.save_observation", false], [6, "module-pettingzoo.utils.conversions", false]], "mqueue (pettingzoo.utils.env_logger.envlogger attribute)": [[4, "pettingzoo.utils.env_logger.EnvLogger.mqueue", false]], "nan_noop_v0()": [[8, "nan_noop_v0", false]], "nan_random_v0()": [[8, "nan_random_v0", false]], "nan_zeros_v0()": [[8, "nan_zeros_v0", false]], "next() (pettingzoo.utils.agent_selector.agentselector method)": [[4, "pettingzoo.utils.agent_selector.AgentSelector.next", false]], "normalize_obs_v0()": [[8, "normalize_obs_v0", false]], "num_agents (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.num_agents", false]], "num_agents (pettingzoo.utils.env.parallelenv attribute)": [[3, "pettingzoo.utils.env.ParallelEnv.num_agents", false]], "observation_space() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.observation_space", false]], "observation_space() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.observation_space", false]], "observation_space() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.observation_space", false]], "observation_space() (pettingzoo.classic.chess.chess.raw_env method)": [[43, "pettingzoo.classic.chess.chess.raw_env.observation_space", false]], "observation_space() (pettingzoo.classic.connect_four.connect_four.raw_env method)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env.observation_space", false]], "observation_space() (pettingzoo.classic.go.go.raw_env method)": [[46, "pettingzoo.classic.go.go.raw_env.observation_space", false]], "observation_space() (pettingzoo.classic.hanabi.hanabi.raw_env method)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env.observation_space", false]], "observation_space() (pettingzoo.classic.rps.rps.raw_env method)": [[49, "pettingzoo.classic.rps.rps.raw_env.observation_space", false]], "observation_space() (pettingzoo.classic.tictactoe.tictactoe.raw_env method)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env.observation_space", false]], "observation_space() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.observation_space", false]], "observation_space() (pettingzoo.sisl.pursuit.pursuit.raw_env method)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env.observation_space", false]], "observation_space() (pettingzoo.sisl.waterworld.waterworld.raw_env method)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env.observation_space", false]], "observation_space() (pettingzoo.utils.env.parallelenv method)": [[3, "pettingzoo.utils.env.ParallelEnv.observation_space", false]], "observation_spaces (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.observation_spaces", false]], "observation_spaces (pettingzoo.utils.env.parallelenv attribute)": [[3, "pettingzoo.utils.env.ParallelEnv.observation_spaces", false]], "observe() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.observe", false]], "observe() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.observe", false]], "observe() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.observe", false]], "observe() (pettingzoo.classic.chess.chess.raw_env method)": [[43, "pettingzoo.classic.chess.chess.raw_env.observe", false]], "observe() (pettingzoo.classic.connect_four.connect_four.raw_env method)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env.observe", false]], "observe() (pettingzoo.classic.go.go.raw_env method)": [[46, "pettingzoo.classic.go.go.raw_env.observe", false]], "observe() (pettingzoo.classic.hanabi.hanabi.raw_env method)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env.observe", false]], "observe() (pettingzoo.classic.rlcard_envs.gin_rummy.raw_env method)": [[45, "pettingzoo.classic.rlcard_envs.gin_rummy.raw_env.observe", false]], "observe() (pettingzoo.classic.rps.rps.raw_env method)": [[49, "pettingzoo.classic.rps.rps.raw_env.observe", false]], "observe() (pettingzoo.classic.tictactoe.tictactoe.raw_env method)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env.observe", false]], "observe() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.observe", false]], "observe() (pettingzoo.sisl.pursuit.pursuit.raw_env method)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env.observe", false]], "observe() (pettingzoo.sisl.waterworld.waterworld.raw_env method)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env.observe", false]], "observe() (pettingzoo.utils.env.aecenv method)": [[2, "pettingzoo.utils.env.AECEnv.observe", false]], "orderenforcingwrapper (class in pettingzoo.utils.wrappers)": [[6, "pettingzoo.utils.wrappers.OrderEnforcingWrapper", false]], "pad_action_space_v0()": [[8, "pad_action_space_v0", false]], "pad_observations_v0()": [[8, "pad_observations_v0", false]], "parallel_to_aec() (in module pettingzoo.utils.conversions)": [[6, "pettingzoo.utils.conversions.parallel_to_aec", false]], "parallelenv (class in pettingzoo.utils.env)": [[3, "pettingzoo.utils.env.ParallelEnv", false]], "pettingzoo.utils.agent_selector": [[4, "module-pettingzoo.utils.agent_selector", false]], "pettingzoo.utils.average_total_reward": [[4, "module-pettingzoo.utils.average_total_reward", false]], "pettingzoo.utils.capture_stdout": [[4, "module-pettingzoo.utils.capture_stdout", false]], "pettingzoo.utils.conversions": [[6, "module-pettingzoo.utils.conversions", false]], "pettingzoo.utils.save_observation": [[4, "module-pettingzoo.utils.save_observation", false]], "possible_agents (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.possible_agents", false]], "possible_agents (pettingzoo.utils.env.parallelenv attribute)": [[3, "pettingzoo.utils.env.ParallelEnv.possible_agents", false]], "raw_env (class in pettingzoo.atari.basketball_pong.basketball_pong)": [[14, "pettingzoo.atari.basketball_pong.basketball_pong.raw_env", false]], "raw_env (class in pettingzoo.atari.boxing.boxing)": [[15, "pettingzoo.atari.boxing.boxing.raw_env", false]], "raw_env (class in pettingzoo.atari.combat_plane.combat_plane)": [[16, "pettingzoo.atari.combat_plane.combat_plane.raw_env", false]], "raw_env (class in pettingzoo.atari.combat_tank.combat_tank)": [[17, "pettingzoo.atari.combat_tank.combat_tank.raw_env", false]], "raw_env (class in pettingzoo.atari.double_dunk.double_dunk)": [[18, "pettingzoo.atari.double_dunk.double_dunk.raw_env", false]], "raw_env (class in pettingzoo.atari.entombed_competitive.entombed_competitive)": [[19, "pettingzoo.atari.entombed_competitive.entombed_competitive.raw_env", false]], "raw_env (class in pettingzoo.atari.entombed_cooperative.entombed_cooperative)": [[20, "pettingzoo.atari.entombed_cooperative.entombed_cooperative.raw_env", false]], "raw_env (class in pettingzoo.atari.flag_capture.flag_capture)": [[21, "pettingzoo.atari.flag_capture.flag_capture.raw_env", false]], "raw_env (class in pettingzoo.atari.foozpong.foozpong)": [[22, "pettingzoo.atari.foozpong.foozpong.raw_env", false]], "raw_env (class in pettingzoo.atari.ice_hockey.ice_hockey)": [[23, "pettingzoo.atari.ice_hockey.ice_hockey.raw_env", false]], "raw_env (class in pettingzoo.atari.joust.joust)": [[24, "pettingzoo.atari.joust.joust.raw_env", false]], "raw_env (class in pettingzoo.atari.mario_bros.mario_bros)": [[25, "pettingzoo.atari.mario_bros.mario_bros.raw_env", false]], "raw_env (class in pettingzoo.atari.maze_craze.maze_craze)": [[26, "pettingzoo.atari.maze_craze.maze_craze.raw_env", false]], "raw_env (class in pettingzoo.atari.othello.othello)": [[27, "pettingzoo.atari.othello.othello.raw_env", false]], "raw_env (class in pettingzoo.atari.pong.pong)": [[28, "pettingzoo.atari.pong.pong.raw_env", false]], "raw_env (class in pettingzoo.atari.quadrapong.quadrapong)": [[29, "pettingzoo.atari.quadrapong.quadrapong.raw_env", false]], "raw_env (class in pettingzoo.atari.space_invaders.space_invaders)": [[30, "pettingzoo.atari.space_invaders.space_invaders.raw_env", false]], "raw_env (class in pettingzoo.atari.space_war.space_war)": [[31, "pettingzoo.atari.space_war.space_war.raw_env", false]], "raw_env (class in pettingzoo.atari.surround.surround)": [[32, "pettingzoo.atari.surround.surround.raw_env", false]], "raw_env (class in pettingzoo.atari.tennis.tennis)": [[33, "pettingzoo.atari.tennis.tennis.raw_env", false]], "raw_env (class in pettingzoo.atari.video_checkers.video_checkers)": [[34, "pettingzoo.atari.video_checkers.video_checkers.raw_env", false]], "raw_env (class in pettingzoo.atari.volleyball_pong.volleyball_pong)": [[35, "pettingzoo.atari.volleyball_pong.volleyball_pong.raw_env", false]], "raw_env (class in pettingzoo.atari.warlords.warlords)": [[36, "pettingzoo.atari.warlords.warlords.raw_env", false]], "raw_env (class in pettingzoo.atari.wizard_of_wor.wizard_of_wor)": [[37, "pettingzoo.atari.wizard_of_wor.wizard_of_wor.raw_env", false]], "raw_env (class in pettingzoo.butterfly.cooperative_pong.cooperative_pong)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env", false]], "raw_env (class in pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env", false]], "raw_env (class in pettingzoo.butterfly.pistonball.pistonball)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env", false]], "raw_env (class in pettingzoo.classic.chess.chess)": [[43, "pettingzoo.classic.chess.chess.raw_env", false]], "raw_env (class in pettingzoo.classic.connect_four.connect_four)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env", false]], "raw_env (class in pettingzoo.classic.go.go)": [[46, "pettingzoo.classic.go.go.raw_env", false]], "raw_env (class in pettingzoo.classic.hanabi.hanabi)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env", false]], "raw_env (class in pettingzoo.classic.rlcard_envs.gin_rummy)": [[45, "pettingzoo.classic.rlcard_envs.gin_rummy.raw_env", false]], "raw_env (class in pettingzoo.classic.rlcard_envs.leduc_holdem)": [[48, "pettingzoo.classic.rlcard_envs.leduc_holdem.raw_env", false]], "raw_env (class in pettingzoo.classic.rlcard_envs.texas_holdem)": [[50, "pettingzoo.classic.rlcard_envs.texas_holdem.raw_env", false]], "raw_env (class in pettingzoo.classic.rlcard_envs.texas_holdem_no_limit)": [[51, "pettingzoo.classic.rlcard_envs.texas_holdem_no_limit.raw_env", false]], "raw_env (class in pettingzoo.classic.rps.rps)": [[49, "pettingzoo.classic.rps.rps.raw_env", false]], "raw_env (class in pettingzoo.classic.tictactoe.tictactoe)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple.simple)": [[55, "pettingzoo.mpe.simple.simple.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_adversary.simple_adversary)": [[56, "pettingzoo.mpe.simple_adversary.simple_adversary.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_crypto.simple_crypto)": [[57, "pettingzoo.mpe.simple_crypto.simple_crypto.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_push.simple_push)": [[58, "pettingzoo.mpe.simple_push.simple_push.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_reference.simple_reference)": [[59, "pettingzoo.mpe.simple_reference.simple_reference.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_speaker_listener.simple_speaker_listener)": [[60, "pettingzoo.mpe.simple_speaker_listener.simple_speaker_listener.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_spread.simple_spread)": [[61, "pettingzoo.mpe.simple_spread.simple_spread.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_tag.simple_tag)": [[62, "pettingzoo.mpe.simple_tag.simple_tag.raw_env", false]], "raw_env (class in pettingzoo.mpe.simple_world_comm.simple_world_comm)": [[63, "pettingzoo.mpe.simple_world_comm.simple_world_comm.raw_env", false]], "raw_env (class in pettingzoo.sisl.multiwalker.multiwalker)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env", false]], "raw_env (class in pettingzoo.sisl.pursuit.pursuit)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env", false]], "raw_env (class in pettingzoo.sisl.waterworld.waterworld)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env", false]], "reinit() (pettingzoo.utils.agent_selector.agentselector method)": [[4, "pettingzoo.utils.agent_selector.AgentSelector.reinit", false]], "render() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.render", false]], "render() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.render", false]], "render() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.render", false]], "render() (pettingzoo.classic.chess.chess.raw_env method)": [[43, "pettingzoo.classic.chess.chess.raw_env.render", false]], "render() (pettingzoo.classic.connect_four.connect_four.raw_env method)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env.render", false]], "render() (pettingzoo.classic.go.go.raw_env method)": [[46, "pettingzoo.classic.go.go.raw_env.render", false]], "render() (pettingzoo.classic.hanabi.hanabi.raw_env method)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env.render", false]], "render() (pettingzoo.classic.rlcard_envs.gin_rummy.raw_env method)": [[45, "pettingzoo.classic.rlcard_envs.gin_rummy.raw_env.render", false]], "render() (pettingzoo.classic.rlcard_envs.leduc_holdem.raw_env method)": [[48, "pettingzoo.classic.rlcard_envs.leduc_holdem.raw_env.render", false]], "render() (pettingzoo.classic.rlcard_envs.texas_holdem.raw_env method)": [[50, "pettingzoo.classic.rlcard_envs.texas_holdem.raw_env.render", false]], "render() (pettingzoo.classic.rlcard_envs.texas_holdem_no_limit.raw_env method)": [[51, "pettingzoo.classic.rlcard_envs.texas_holdem_no_limit.raw_env.render", false]], "render() (pettingzoo.classic.rps.rps.raw_env method)": [[49, "pettingzoo.classic.rps.rps.raw_env.render", false]], "render() (pettingzoo.classic.tictactoe.tictactoe.raw_env method)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env.render", false]], "render() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.render", false]], "render() (pettingzoo.sisl.pursuit.pursuit.raw_env method)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env.render", false]], "render() (pettingzoo.sisl.waterworld.waterworld.raw_env method)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env.render", false]], "render() (pettingzoo.utils.env.aecenv method)": [[2, "pettingzoo.utils.env.AECEnv.render", false]], "render() (pettingzoo.utils.env.parallelenv method)": [[3, "pettingzoo.utils.env.ParallelEnv.render", false]], "reset() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.reset", false]], "reset() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.reset", false]], "reset() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.reset", false]], "reset() (pettingzoo.classic.chess.chess.raw_env method)": [[43, "pettingzoo.classic.chess.chess.raw_env.reset", false]], "reset() (pettingzoo.classic.connect_four.connect_four.raw_env method)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env.reset", false]], "reset() (pettingzoo.classic.go.go.raw_env method)": [[46, "pettingzoo.classic.go.go.raw_env.reset", false]], "reset() (pettingzoo.classic.hanabi.hanabi.raw_env method)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env.reset", false]], "reset() (pettingzoo.classic.rps.rps.raw_env method)": [[49, "pettingzoo.classic.rps.rps.raw_env.reset", false]], "reset() (pettingzoo.classic.tictactoe.tictactoe.raw_env method)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env.reset", false]], "reset() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.reset", false]], "reset() (pettingzoo.sisl.pursuit.pursuit.raw_env method)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env.reset", false]], "reset() (pettingzoo.sisl.waterworld.waterworld.raw_env method)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env.reset", false]], "reset() (pettingzoo.utils.agent_selector.agentselector method)": [[4, "pettingzoo.utils.agent_selector.AgentSelector.reset", false]], "reset() (pettingzoo.utils.env.aecenv method)": [[2, "pettingzoo.utils.env.AECEnv.reset", false]], "reset() (pettingzoo.utils.env.parallelenv method)": [[3, "pettingzoo.utils.env.ParallelEnv.reset", false]], "reshape_v0()": [[8, "reshape_v0", false]], "resize_v1()": [[8, "resize_v1", false]], "rewards (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.rewards", false]], "save_observation() (in module pettingzoo.utils.save_observation)": [[4, "pettingzoo.utils.save_observation.save_observation", false]], "scale_actions_v0()": [[8, "scale_actions_v0", false]], "state() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.state", false]], "state() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.state", false]], "state() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.state", false]], "state() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.state", false]], "state() (pettingzoo.utils.env.parallelenv method)": [[3, "pettingzoo.utils.env.ParallelEnv.state", false]], "step() (pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env method)": [[39, "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env.step", false]], "step() (pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env method)": [[40, "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env.step", false]], "step() (pettingzoo.butterfly.pistonball.pistonball.raw_env method)": [[41, "pettingzoo.butterfly.pistonball.pistonball.raw_env.step", false]], "step() (pettingzoo.classic.chess.chess.raw_env method)": [[43, "pettingzoo.classic.chess.chess.raw_env.step", false]], "step() (pettingzoo.classic.connect_four.connect_four.raw_env method)": [[44, "pettingzoo.classic.connect_four.connect_four.raw_env.step", false]], "step() (pettingzoo.classic.go.go.raw_env method)": [[46, "pettingzoo.classic.go.go.raw_env.step", false]], "step() (pettingzoo.classic.hanabi.hanabi.raw_env method)": [[47, "pettingzoo.classic.hanabi.hanabi.raw_env.step", false]], "step() (pettingzoo.classic.rlcard_envs.gin_rummy.raw_env method)": [[45, "pettingzoo.classic.rlcard_envs.gin_rummy.raw_env.step", false]], "step() (pettingzoo.classic.rlcard_envs.leduc_holdem.raw_env method)": [[48, "pettingzoo.classic.rlcard_envs.leduc_holdem.raw_env.step", false]], "step() (pettingzoo.classic.rlcard_envs.texas_holdem.raw_env method)": [[50, "pettingzoo.classic.rlcard_envs.texas_holdem.raw_env.step", false]], "step() (pettingzoo.classic.rlcard_envs.texas_holdem_no_limit.raw_env method)": [[51, "pettingzoo.classic.rlcard_envs.texas_holdem_no_limit.raw_env.step", false]], "step() (pettingzoo.classic.rps.rps.raw_env method)": [[49, "pettingzoo.classic.rps.rps.raw_env.step", false]], "step() (pettingzoo.classic.tictactoe.tictactoe.raw_env method)": [[52, "pettingzoo.classic.tictactoe.tictactoe.raw_env.step", false]], "step() (pettingzoo.sisl.multiwalker.multiwalker.raw_env method)": [[65, "pettingzoo.sisl.multiwalker.multiwalker.raw_env.step", false]], "step() (pettingzoo.sisl.pursuit.pursuit.raw_env method)": [[66, "pettingzoo.sisl.pursuit.pursuit.raw_env.step", false]], "step() (pettingzoo.sisl.waterworld.waterworld.raw_env method)": [[67, "pettingzoo.sisl.waterworld.waterworld.raw_env.step", false]], "step() (pettingzoo.utils.env.aecenv method)": [[2, "pettingzoo.utils.env.AECEnv.step", false]], "step() (pettingzoo.utils.env.parallelenv method)": [[3, "pettingzoo.utils.env.ParallelEnv.step", false]], "sticky_actions_v0()": [[8, "sticky_actions_v0", false]], "suppress_output() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.suppress_output", false]], "terminateillegalwrapper (class in pettingzoo.utils.wrappers)": [[6, "pettingzoo.utils.wrappers.TerminateIllegalWrapper", false]], "terminations (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.terminations", false]], "truncations (pettingzoo.utils.env.aecenv attribute)": [[2, "pettingzoo.utils.env.AECEnv.truncations", false]], "unsuppress_output() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.unsuppress_output", false]], "warn_action_out_of_bound() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.warn_action_out_of_bound", false]], "warn_on_illegal_move() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.warn_on_illegal_move", false]], "warn_step_after_terminated_truncated() (pettingzoo.utils.env_logger.envlogger static method)": [[4, "pettingzoo.utils.env_logger.EnvLogger.warn_step_after_terminated_truncated", false]]}, "objects": {"": [[8, 0, 1, "", "agent_indicator_v0"], [8, 0, 1, "", "black_death_v2"], [8, 0, 1, "", "clip_actions_v0"], [8, 0, 1, "", "clip_reward_v0"], [8, 0, 1, "", "color_reduction_v0"], [8, 0, 1, "", "delay_observations_v0"], [8, 0, 1, "", "dtype_v0"], [8, 0, 1, "", "flatten_v0"], [8, 0, 1, "", "frame_skip_v0"], [8, 0, 1, "", "frame_stack_v1"], [8, 0, 1, "", "max_observation_v0"], [8, 0, 1, "", "nan_noop_v0"], [8, 0, 1, "", "nan_random_v0"], [8, 0, 1, "", "nan_zeros_v0"], [8, 0, 1, "", "normalize_obs_v0"], [8, 0, 1, "", "pad_action_space_v0"], [8, 0, 1, "", "pad_observations_v0"], [8, 0, 1, "", "reshape_v0"], [8, 0, 1, "", "resize_v1"], [8, 0, 1, "", "scale_actions_v0"], [8, 0, 1, "", "sticky_actions_v0"]], "pettingzoo.atari.basketball_pong.basketball_pong": [[14, 1, 1, "", "raw_env"]], "pettingzoo.atari.boxing.boxing": [[15, 1, 1, "", "raw_env"]], "pettingzoo.atari.combat_plane.combat_plane": [[16, 1, 1, "", "raw_env"]], "pettingzoo.atari.combat_tank.combat_tank": [[17, 1, 1, "", "raw_env"]], "pettingzoo.atari.double_dunk.double_dunk": [[18, 1, 1, "", "raw_env"]], "pettingzoo.atari.entombed_competitive.entombed_competitive": [[19, 1, 1, "", "raw_env"]], "pettingzoo.atari.entombed_cooperative.entombed_cooperative": [[20, 1, 1, "", "raw_env"]], "pettingzoo.atari.flag_capture.flag_capture": [[21, 1, 1, "", "raw_env"]], "pettingzoo.atari.foozpong.foozpong": [[22, 1, 1, "", "raw_env"]], "pettingzoo.atari.ice_hockey.ice_hockey": [[23, 1, 1, "", "raw_env"]], "pettingzoo.atari.joust.joust": [[24, 1, 1, "", "raw_env"]], "pettingzoo.atari.mario_bros.mario_bros": [[25, 1, 1, "", "raw_env"]], "pettingzoo.atari.maze_craze.maze_craze": [[26, 1, 1, "", "raw_env"]], "pettingzoo.atari.othello.othello": [[27, 1, 1, "", "raw_env"]], "pettingzoo.atari.pong.pong": [[28, 1, 1, "", "raw_env"]], "pettingzoo.atari.quadrapong.quadrapong": [[29, 1, 1, "", "raw_env"]], "pettingzoo.atari.space_invaders.space_invaders": [[30, 1, 1, "", "raw_env"]], "pettingzoo.atari.space_war.space_war": [[31, 1, 1, "", "raw_env"]], "pettingzoo.atari.surround.surround": [[32, 1, 1, "", "raw_env"]], "pettingzoo.atari.tennis.tennis": [[33, 1, 1, "", "raw_env"]], "pettingzoo.atari.video_checkers.video_checkers": [[34, 1, 1, "", "raw_env"]], "pettingzoo.atari.volleyball_pong.volleyball_pong": [[35, 1, 1, "", "raw_env"]], "pettingzoo.atari.warlords.warlords": [[36, 1, 1, "", "raw_env"]], "pettingzoo.atari.wizard_of_wor.wizard_of_wor": [[37, 1, 1, "", "raw_env"]], "pettingzoo.butterfly.cooperative_pong.cooperative_pong": [[39, 1, 1, "", "env"], [39, 1, 1, "", "raw_env"]], "pettingzoo.butterfly.cooperative_pong.cooperative_pong.raw_env": [[39, 2, 1, "", "action_space"], [39, 2, 1, "", "close"], [39, 2, 1, "", "observation_space"], [39, 2, 1, "", "observe"], [39, 2, 1, "", "render"], [39, 2, 1, "", "reset"], [39, 2, 1, "", "state"], [39, 2, 1, "", "step"]], "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies": [[40, 1, 1, "", "env"], [40, 1, 1, "", "raw_env"]], "pettingzoo.butterfly.knights_archers_zombies.knights_archers_zombies.raw_env": [[40, 2, 1, "", "action_space"], [40, 2, 1, "", "close"], [40, 2, 1, "", "observation_space"], [40, 2, 1, "", "observe"], [40, 2, 1, "", "render"], [40, 2, 1, "", "reset"], [40, 2, 1, "", "state"], [40, 2, 1, "", "step"]], "pettingzoo.butterfly.pistonball.pistonball": [[41, 1, 1, "", "env"], [41, 1, 1, "", "raw_env"]], "pettingzoo.butterfly.pistonball.pistonball.raw_env": [[41, 2, 1, "", "action_space"], [41, 2, 1, "", "close"], [41, 2, 1, "", "observation_space"], [41, 2, 1, "", "observe"], [41, 2, 1, "", "render"], [41, 2, 1, "", "reset"], [41, 2, 1, "", "state"], [41, 2, 1, "", "step"]], "pettingzoo.classic.chess.chess": [[43, 1, 1, "", "env"], [43, 1, 1, "", "raw_env"]], "pettingzoo.classic.chess.chess.raw_env": [[43, 2, 1, "", "action_space"], [43, 2, 1, "", "close"], [43, 2, 1, "", "observation_space"], [43, 2, 1, "", "observe"], [43, 2, 1, "", "render"], [43, 2, 1, "", "reset"], [43, 2, 1, "", "step"]], "pettingzoo.classic.connect_four.connect_four": [[44, 1, 1, "", "env"], [44, 1, 1, "", "raw_env"]], "pettingzoo.classic.connect_four.connect_four.raw_env": [[44, 2, 1, "", "action_space"], [44, 2, 1, "", "close"], [44, 2, 1, "", "observation_space"], [44, 2, 1, "", "observe"], [44, 2, 1, "", "render"], [44, 2, 1, "", "reset"], [44, 2, 1, "", "step"]], "pettingzoo.classic.go.go": [[46, 1, 1, "", "env"], [46, 1, 1, "", "raw_env"]], "pettingzoo.classic.go.go.raw_env": [[46, 2, 1, "", "action_space"], [46, 2, 1, "", "close"], [46, 2, 1, "", "observation_space"], [46, 2, 1, "", "observe"], [46, 2, 1, "", "render"], [46, 2, 1, "", "reset"], [46, 2, 1, "", "step"]], "pettingzoo.classic.hanabi.hanabi": [[47, 1, 1, "", "env"], [47, 1, 1, "", "raw_env"]], "pettingzoo.classic.hanabi.hanabi.raw_env": [[47, 2, 1, "", "action_space"], [47, 2, 1, "", "close"], [47, 2, 1, "", "observation_space"], [47, 2, 1, "", "observe"], [47, 2, 1, "", "render"], [47, 2, 1, "", "reset"], [47, 2, 1, "", "step"]], "pettingzoo.classic.rlcard_envs.gin_rummy": [[45, 1, 1, "", "env"], [45, 1, 1, "", "raw_env"]], "pettingzoo.classic.rlcard_envs.gin_rummy.raw_env": [[45, 2, 1, "", "observe"], [45, 2, 1, "", "render"], [45, 2, 1, "", "step"]], "pettingzoo.classic.rlcard_envs.leduc_holdem": [[48, 1, 1, "", "env"], [48, 1, 1, "", "raw_env"]], "pettingzoo.classic.rlcard_envs.leduc_holdem.raw_env": [[48, 2, 1, "", "render"], [48, 2, 1, "", "step"]], "pettingzoo.classic.rlcard_envs.texas_holdem": [[50, 1, 1, "", "env"], [50, 1, 1, "", "raw_env"]], "pettingzoo.classic.rlcard_envs.texas_holdem.raw_env": [[50, 2, 1, "", "render"], [50, 2, 1, "", "step"]], "pettingzoo.classic.rlcard_envs.texas_holdem_no_limit": [[51, 1, 1, "", "env"], [51, 1, 1, "", "raw_env"]], "pettingzoo.classic.rlcard_envs.texas_holdem_no_limit.raw_env": [[51, 2, 1, "", "render"], [51, 2, 1, "", "step"]], "pettingzoo.classic.rps.rps": [[49, 1, 1, "", "env"], [49, 1, 1, "", "raw_env"]], "pettingzoo.classic.rps.rps.raw_env": [[49, 2, 1, "", "action_space"], [49, 2, 1, "", "close"], [49, 2, 1, "", "observation_space"], [49, 2, 1, "", "observe"], [49, 2, 1, "", "render"], [49, 2, 1, "", "reset"], [49, 2, 1, "", "step"]], "pettingzoo.classic.tictactoe.tictactoe": [[52, 1, 1, "", "env"], [52, 1, 1, "", "raw_env"]], "pettingzoo.classic.tictactoe.tictactoe.raw_env": [[52, 2, 1, "", "action_space"], [52, 2, 1, "", "close"], [52, 2, 1, "", "observation_space"], [52, 2, 1, "", "observe"], [52, 2, 1, "", "render"], [52, 2, 1, "", "reset"], [52, 2, 1, "", "step"]], "pettingzoo.mpe.simple.simple": [[55, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_adversary.simple_adversary": [[56, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_crypto.simple_crypto": [[57, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_push.simple_push": [[58, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_reference.simple_reference": [[59, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_speaker_listener.simple_speaker_listener": [[60, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_spread.simple_spread": [[61, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_tag.simple_tag": [[62, 1, 1, "", "raw_env"]], "pettingzoo.mpe.simple_world_comm.simple_world_comm": [[63, 1, 1, "", "raw_env"]], "pettingzoo.sisl.multiwalker.multiwalker": [[65, 1, 1, "", "env"], [65, 1, 1, "", "raw_env"]], "pettingzoo.sisl.multiwalker.multiwalker.raw_env": [[65, 2, 1, "", "action_space"], [65, 2, 1, "", "close"], [65, 2, 1, "", "observation_space"], [65, 2, 1, "", "observe"], [65, 2, 1, "", "render"], [65, 2, 1, "", "reset"], [65, 2, 1, "", "state"], [65, 2, 1, "", "step"]], "pettingzoo.sisl.pursuit.pursuit": [[66, 1, 1, "", "env"], [66, 1, 1, "", "raw_env"]], "pettingzoo.sisl.pursuit.pursuit.raw_env": [[66, 2, 1, "", "action_space"], [66, 2, 1, "", "close"], [66, 2, 1, "", "observation_space"], [66, 2, 1, "", "observe"], [66, 2, 1, "", "render"], [66, 2, 1, "", "reset"], [66, 2, 1, "", "step"]], "pettingzoo.sisl.waterworld.waterworld": [[67, 1, 1, "", "env"], [67, 1, 1, "", "raw_env"]], "pettingzoo.sisl.waterworld.waterworld.raw_env": [[67, 2, 1, "", "action_space"], [67, 2, 1, "", "close"], [67, 2, 1, "", "observation_space"], [67, 2, 1, "", "observe"], [67, 2, 1, "", "render"], [67, 2, 1, "", "reset"], [67, 2, 1, "", "step"]], "pettingzoo.utils": [[4, 3, 0, "-", "agent_selector"], [4, 3, 0, "-", "average_total_reward"], [4, 3, 0, "-", "capture_stdout"], [6, 3, 0, "-", "conversions"], [4, 3, 0, "-", "save_observation"]], "pettingzoo.utils.agent_selector": [[4, 1, 1, "", "AgentSelector"], [4, 1, 1, "", "agent_selector"]], "pettingzoo.utils.agent_selector.AgentSelector": [[4, 2, 1, "", "is_first"], [4, 2, 1, "", "is_last"], [4, 2, 1, "", "next"], [4, 2, 1, "", "reinit"], [4, 2, 1, "", "reset"]], "pettingzoo.utils.average_total_reward": [[4, 0, 1, "", "average_total_reward"]], "pettingzoo.utils.capture_stdout": [[4, 1, 1, "", "capture_stdout"]], "pettingzoo.utils.conversions": [[6, 0, 1, "", "aec_to_parallel"], [6, 0, 1, "", "parallel_to_aec"]], "pettingzoo.utils.env": [[2, 1, 1, "", "AECEnv"], [3, 1, 1, "", "ParallelEnv"]], "pettingzoo.utils.env.AECEnv": [[2, 4, 1, "", "action_spaces"], [2, 4, 1, "", "agent_selection"], [2, 4, 1, "", "agents"], [2, 2, 1, "", "close"], [2, 4, 1, "", "infos"], [2, 4, 1, "", "max_num_agents"], [2, 4, 1, "", "num_agents"], [2, 4, 1, "", "observation_spaces"], [2, 2, 1, "", "observe"], [2, 4, 1, "", "possible_agents"], [2, 2, 1, "", "render"], [2, 2, 1, "", "reset"], [2, 4, 1, "", "rewards"], [2, 2, 1, "", "step"], [2, 4, 1, "", "terminations"], [2, 4, 1, "", "truncations"]], "pettingzoo.utils.env.ParallelEnv": [[3, 2, 1, "", "action_space"], [3, 4, 1, "", "action_spaces"], [3, 4, 1, "", "agents"], [3, 2, 1, "", "close"], [3, 4, 1, "", "max_num_agents"], [3, 4, 1, "", "num_agents"], [3, 2, 1, "", "observation_space"], [3, 4, 1, "", "observation_spaces"], [3, 4, 1, "", "possible_agents"], [3, 2, 1, "", "render"], [3, 2, 1, "", "reset"], [3, 2, 1, "", "state"], [3, 2, 1, "", "step"]], "pettingzoo.utils.env_logger": [[4, 1, 1, "", "EnvLogger"]], "pettingzoo.utils.env_logger.EnvLogger": [[4, 2, 1, "", "error_agent_iter_before_reset"], [4, 2, 1, "", "error_nan_action"], [4, 2, 1, "", "error_observe_before_reset"], [4, 2, 1, "", "error_possible_agents_attribute_missing"], [4, 2, 1, "", "error_render_before_reset"], [4, 2, 1, "", "error_state_before_reset"], [4, 2, 1, "", "error_step_before_reset"], [4, 2, 1, "", "flush"], [4, 2, 1, "", "get_logger"], [4, 4, 1, "", "mqueue"], [4, 2, 1, "", "suppress_output"], [4, 2, 1, "", "unsuppress_output"], [4, 2, 1, "", "warn_action_out_of_bound"], [4, 2, 1, "", "warn_on_illegal_move"], [4, 2, 1, "", "warn_step_after_terminated_truncated"]], "pettingzoo.utils.save_observation": [[4, 0, 1, "", "save_observation"]], "pettingzoo.utils.wrappers": [[6, 1, 1, "", "AssertOutOfBoundsWrapper"], [6, 1, 1, "", "BaseWrapper"], [6, 1, 1, "", "CaptureStdoutWrapper"], [6, 1, 1, "", "ClipOutOfBoundsWrapper"], [6, 1, 1, "", "OrderEnforcingWrapper"], [6, 1, 1, "", "TerminateIllegalWrapper"]]}, "objnames": {"0": ["py", "function", "Python function"], "1": ["py", "class", "Python class"], "2": ["py", "method", "Python method"], "3": ["py", "module", "Python module"], "4": ["py", "attribute", "Python attribute"]}, "objtypes": {"0": "py:function", "1": "py:class", "2": "py:method", "3": "py:module", "4": "py:attribute"}, "terms": {"": [2, 3, 6, 7, 8, 9, 10, 11, 12, 13, 16, 17, 19, 20, 21, 22, 23, 25, 27, 29, 30, 34, 35, 39, 40, 41, 43, 44, 45, 46, 47, 48, 50, 51, 54, 63, 65, 67, 68, 70, 71, 72, 73, 74, 75, 76, 77, 79, 80, 86, 87, 88, 89, 90, 92, 93, 94], "0": [2, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "000001": 71, "0001": [71, 72], "001": [12, 72, 73, 76], "01": [12, 66, 67, 70, 71, 72, 73, 75, 76], "015": 67, "02": [70, 71], "03": [70, 90, 91], "04": [70, 90], "04376": 42, "04908": 54, "05": [63, 70, 71, 94, 97], "06": [70, 87, 89, 90], "07": 70, "08": 70, "08932": 8, "09": 70, "09341": 13, "0th": 47, "1": [2, 6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 68, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "10": [9, 11, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 31, 33, 34, 39, 40, 46, 47, 54, 56, 59, 62, 65, 67, 71, 72, 73, 87, 89, 92, 93, 94, 95, 97], "100": [4, 10, 15, 26, 30, 39, 41, 45, 47, 51, 65, 71, 72, 73, 79, 80, 86, 90, 92, 93], "1000": [11, 37, 45, 48, 50, 51, 52, 94, 97], "10000": [47, 72], "100000": [13, 71, 73, 87], "10000000": 87, "10000000000": 4, "1002": 70, "1003": 70, "1004": 70, "1010": 70, "1011": 70, "1012": 70, "1013": 70, "1014": 70, "1015": 70, "1016": 70, "1017": 70, "1018": 70, "1019": 70, "1020": 70, "1024": [13, 70], "1026": 70, "1029": 70, "1031": 70, "1033": 70, "1034": 70, "1036": 70, "1037": 70, "1038": 70, "1041": 70, "1045": 70, "1046": 70, "1047": 70, "1051": 70, "1054": 70, "1055": 70, "1057": 70, "1058": 70, "1071": 70, "1074": 70, "1077": 70, "1080": 70, "1082": 70, "1083": 70, "1084": 70, "1086": 70, "1087": 70, "1088": 70, "1089": 70, "109": 45, "1090": 70, "1092": 70, "1095": 70, "1096": 70, "1097": 70, "10_000": [90, 92, 93], "10k": 90, "10x": 90, "11": [9, 15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 39, 43, 45, 46, 47, 48, 50, 51, 60, 65, 75, 76], "110": 45, "1103": 70, "1105": 70, "1107": 70, "111": 43, "1110": 70, "11111": 47, "1112": 70, "1116": 70, "1120": 70, "1124": 70, "1128": 70, "1129": 70, "1130": 70, "1133": 70, "1134": 70, "1135": 70, "1137": 70, "1139": 70, "1140": 70, "1144": 70, "1148": 70, "1149": 70, "1152": 70, "1153": 70, "1154": 70, "1155": 70, "11_12": [87, 89], "12": [15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 39, 43, 45, 47, 50, 51, 65], "120": [18, 41, 71, 72], "1200": 15, "12000": 75, "124": 47, "125": [12, 41, 47, 76, 89], "128": [12, 71, 72, 73, 75, 76, 89, 94, 97], "1280": 40, "13": [15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 43, 45, 47, 50, 51, 65, 71, 72, 73, 75, 76, 87, 89], "14": [15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 39, 40, 45, 47, 48, 50, 51, 60, 62, 65, 66], "15": [15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 47, 49, 65, 71, 72, 73], "150": 71, "16": [15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 40, 47, 62, 66, 75], "160": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37], "1626": 94, "16x16": 40, "17": [15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 40, 47], "1703": 54, "174": 47, "175": 47, "179": 47, "18": [9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 43, 45, 47, 61, 72, 73, 79, 80], "180": 47, "184": 47, "185": 47, "189": 47, "19": [43, 45, 46, 47, 48, 58, 87, 89], "190": 47, "1910": 42, "192": 63, "195": 47, "196_608": 93, "199": 47, "1_000_000": 81, "1d": 8, "1e": [12, 65, 71, 75, 76, 90, 93, 94, 97], "1e10": 87, "1st": [43, 46, 47], "2": [7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 56, 57, 58, 59, 60, 62, 63, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "20": [40, 41, 43, 47, 48, 57, 63, 67, 71, 72, 73, 86, 89, 90], "200": [12, 30, 37, 47, 65, 71, 76, 87], "20000": [25, 94], "200000": 71, "2000000": 75, "2008": 8, "2009": 13, "2013": 13, "2017": [54, 64], "2018": [8, 13], "2019": 42, "2020": [8, 13, 70], "2021": 70, "2022": [2, 7, 70, 91], "2023": 70, "2024": 70, "207": 47, "208": 47, "20_000": 97, "20_480": 90, "20k": 90, "21": [48, 94, 95, 97], "210": [14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 32, 33, 34, 35, 36, 37, 47], "211": 47, "22": [48, 67, 71, 72, 73, 94, 95, 97], "23": [20, 43, 47, 65, 71, 72, 73, 94, 95, 97], "24": [47, 65, 71, 72, 73, 75, 76, 87, 89, 90, 92, 93], "242": [67, 93], "25": [9, 13, 45, 47, 50, 51, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 70, 73, 89, 91], "250": [7, 26, 31], "2500": 37, "253": 13, "255": [12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 71, 72, 73, 75, 76], "256": [16, 71, 75, 92, 93], "26": [45, 50, 51, 65, 70], "260": 47, "261": 47, "262": 47, "263": 47, "266": 47, "267": 47, "268": 47, "269": 47, "27": [45, 50, 51, 58, 65, 70], "273": 47, "274": 47, "278": 47, "279": [13, 47], "28": [56, 59, 63, 65, 70, 71, 72, 73], "280": [39, 47], "281": 47, "282": 47, "283": 47, "29": [65, 70], "2d": [8, 46, 67], "2e": 89, "2f": [72, 73], "2n": 46, "2nd": [46, 47], "2x3": 71, "3": [8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 45, 46, 47, 48, 49, 50, 51, 52, 56, 59, 60, 61, 62, 63, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 92, 93, 94, 95, 97], "30": [30, 65, 66, 67, 87, 89, 90], "300": 65, "3000": 24, "30000": 71, "307": 47, "308": 47, "31": [45, 65, 71, 72, 73], "3136": 89, "32": [12, 45, 72, 73, 75, 76, 89], "320": [94, 97], "32999": 70, "33": 48, "34": 63, "342": 47, "343": 47, "34696": 70, "35": 48, "36": 48, "362": 46, "377": 47, "378": 47, "38": [45, 50, 51], "39": [45, 50, 51], "3d": 8, "3rd": [47, 70], "3x3": 52, "4": [8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 57, 62, 63, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 94, 95, 97], "40": [45, 50, 51, 90], "400": 71, "4000": 96, "40k": 90, "40x40": 40, "412": 47, "413": 47, "42": [2, 3, 4, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 69], "44": 45, "445": 47, "447": 47, "45": [45, 71], "457": 41, "4672": 43, "47": 13, "480": 39, "482": 47, "483": 47, "49": 47, "4th": 47, "4x": 74, "4x2x2": 71, "4x2x3": 71, "4x2x3x2": 71, "5": [11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 58, 59, 60, 61, 62, 63, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 86, 89, 90, 92, 94, 95, 97], "50": [7, 43, 47, 59, 62, 63, 70, 71, 87, 89, 90, 94, 97], "500": [65, 66, 67, 71, 72, 73], "50000": [87, 89], "5000000": 89, "51": [45, 50, 51, 71], "512": [12, 40, 75, 76, 89], "512px": 92, "512x512": 40, "517": 47, "518": 47, "52": [45, 50, 51], "523": 13, "53": [50, 51], "54": [51, 61], "552": 47, "553": 47, "56": [43, 50], "560": [39, 41], "562": 13, "57": [45, 50, 87, 89], "58": [45, 50], "587": 47, "588": 47, "59": 45, "5cat": 70, "5e": 75, "5th": 43, "5x52": 45, "6": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 40, 41, 43, 44, 45, 46, 47, 48, 49, 52, 63, 65, 67, 71, 74, 75, 79, 80, 86, 94, 95, 97], "6000": [71, 72, 73], "600000": 71, "61": [13, 50], "612": 71, "62": [50, 62], "621": 70, "622": 47, "63": [9, 50], "64": [12, 71, 72, 75, 76, 89, 94, 97], "65": [71, 72, 73], "657": 47, "658": 47, "66": [50, 64], "663": 47, "67": 50, "68": 50, "6x7": 44, "6x7x2": 71, "7": [15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 31, 33, 37, 43, 44, 45, 46, 47, 48, 49, 52, 65, 66, 67, 71, 75, 79, 80, 87, 89, 94], "70": [7, 45], "700": 71, "71": [45, 50], "72": 50, "720": 40, "73": 43, "731": 70, "732": 70, "734": 70, "737": 70, "738": 70, "739": 70, "74": 47, "741": 70, "743": 70, "747": 70, "748": 70, "749": 70, "75": [41, 47, 65, 67, 89, 90], "750": 70, "76": 90, "763": 70, "767": 70, "776": 70, "777": 70, "779": 70, "780": 70, "781": 70, "782": 70, "787": 70, "788": 70, "789": 70, "790": 70, "796": 70, "798": 70, "7e": 90, "7x7": 79, "8": [9, 12, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 31, 33, 37, 43, 44, 45, 46, 47, 48, 50, 51, 52, 56, 57, 58, 59, 65, 66, 67, 71, 72, 75, 76, 86, 89, 92, 93, 94, 95, 97], "80": 90, "800": [25, 41, 43, 46, 49, 70], "8000": 75, "802": 70, "804": 70, "807": 70, "808": 70, "809": 70, "810": 70, "814": 70, "817": 70, "818": 70, "8192": 90, "81_920": 92, "821": 70, "822": 70, "823": 70, "825": 70, "829": 70, "83": [45, 64], "831": 70, "832": 70, "833": 70, "835": 70, "836": 70, "837": 70, "838": 70, "839": 70, "84": [13, 45, 72, 75, 89, 92], "840": 70, "841": 70, "842": 70, "843": 70, "844": 70, "845": 70, "846": 70, "847": 70, "848": 70, "84px": 92, "850": 70, "852": 70, "853": 70, "854": 70, "855": 70, "856": 70, "857": 70, "858": 70, "859": 70, "86": 90, "865": 70, "867": 70, "869": 70, "870": 70, "872": 70, "874": 70, "875": 70, "876": 70, "879": 70, "880": [41, 70], "882": 70, "883": 70, "886": 70, "890": 70, "891": 70, "894": 70, "897": 70, "8th": 43, "8x8": 43, "8x8x73": 43, "9": [9, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 37, 39, 43, 44, 46, 47, 49, 62, 63, 65, 71, 72, 73, 75, 76, 87, 89, 92, 93, 94, 97], "900": [9, 39, 40, 72], "903": 70, "904": 70, "906": 70, "907": 70, "908": 70, "942": 70, "948": 70, "95": [72, 73, 75], "950": 70, "953": 70, "954": 70, "96": 45, "960": [39, 70], "964": 70, "968": 70, "97": 45, "970": 70, "972": 70, "975": 70, "979": 70, "980": 70, "984": 70, "985": 70, "986": 70, "987": 70, "99": [12, 71, 75, 76, 89], "990": 70, "991": 70, "992": 70, "993": 70, "994": 70, "995": [72, 73], "997": 70, "998": 70, "999": 70, "9998": 71, "A": [2, 3, 5, 6, 9, 10, 14, 21, 25, 26, 32, 33, 34, 40, 41, 42, 43, 44, 45, 47, 50, 51, 66, 68, 71, 77, 78, 92], "And": [3, 10, 79, 80], "As": [11, 38, 40, 47, 48, 64, 70, 71], "At": [4, 8, 10, 44, 45, 47, 48, 51, 61, 71, 78], "But": [14, 32, 54], "By": [2, 4, 47, 62, 63, 65, 66, 71], "For": [1, 2, 3, 7, 8, 10, 11, 13, 40, 41, 43, 45, 46, 47, 52, 57, 65, 67, 70, 71, 72, 73, 74, 79, 80, 83, 86, 90, 91, 92, 93], "If": [2, 3, 4, 6, 7, 8, 9, 10, 11, 13, 14, 17, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 44, 45, 47, 49, 52, 54, 64, 65, 67, 68, 71, 72, 73, 75, 76, 79, 80, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "In": [2, 3, 6, 9, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 40, 41, 42, 43, 51, 54, 55, 56, 57, 63, 65, 68, 70, 71, 80, 90], "It": [3, 4, 9, 10, 39, 43, 65, 68, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97], "Its": 26, "NOT": 75, "No": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 67, 70, 95], "Not": [9, 73], "Of": 13, "On": 23, "One": [43, 47, 56, 85], "THE": [12, 76], "TO": 75, "That": 47, "The": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 15, 16, 17, 18, 20, 25, 26, 27, 30, 31, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 56, 58, 59, 61, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 75, 76, 77, 78, 79, 80, 86, 87, 89, 90, 92, 93, 94, 95, 97], "Their": 9, "Then": [75, 91], "There": [9, 13, 25, 26, 39, 40, 45, 47, 70, 85], "These": [2, 3, 9, 10, 42, 43, 47, 54, 67, 68, 70, 74, 79, 80, 83, 85, 88, 90, 91, 96], "To": [1, 2, 6, 7, 8, 9, 10, 11, 13, 22, 27, 32, 34, 38, 39, 42, 54, 64, 70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "Will": [94, 95, 97], "_": [8, 12, 71, 72, 73, 75, 76, 87, 90, 92, 93, 94, 97], "__": 75, "_____": 86, "_________": 52, "__doc__": 86, "__file__": 75, "__future__": [92, 93], "__init__": [8, 10, 12, 71, 75, 76, 78, 79, 80, 86, 87, 89], "__main__": [12, 71, 72, 73, 75, 76, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "__name__": [12, 71, 72, 73, 75, 76, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "_accumulate_reward": 10, "_act": 86, "_action_emb": 87, "_action_spac": 10, "_agent_selector": 10, "_build": 1, "_clear_reward": 10, "_cumulative_reward": [10, 90], "_elit": 71, "_get_ag": 97, "_get_env": 97, "_label_with_episode_numb": [71, 72, 73], "_layer_init": [12, 76], "_observation_spac": 10, "_opp": 71, "_script": 1, "_value_out": 89, "_was_dead_step": 10, "ab": [12, 75, 76], "abbeel": 54, "abil": [30, 71], "abl": [9, 11, 16, 21, 26, 35], "about": [1, 3, 6, 41, 47, 54, 65, 67, 70, 71, 74, 78, 79, 85, 90], "abov": [9, 24, 26, 35, 41, 78, 87], "absolut": [40, 54, 81], "ac": 45, "acceler": [31, 67, 70], "accept": [2, 8, 9, 10, 16, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 65, 66, 67, 70, 90], "access": [2, 6, 9, 12, 54, 70, 76, 90, 91, 97], "accord": [2, 71, 72, 73, 86], "accordingli": 41, "account": [10, 31, 70, 71], "accumul": [8, 10, 43], "accur": 74, "achiev": [38, 41, 54, 65, 71], "acpc": 51, "across": [4, 30, 41, 70, 77], "act": [2, 8, 9, 10, 41, 49, 67, 71, 72, 73, 78, 86, 90, 92, 93], "act_messag": 86, "act_spac": [87, 89], "action": [3, 4, 6, 7, 8, 9, 10, 12, 13, 38, 39, 40, 41, 42, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 69, 70, 71, 72, 73, 75, 76, 78, 79, 83, 85, 87, 89, 91, 94], "action_": 71, "action_6": 49, "action_7": 49, "action_dim": [71, 72, 73], "action_embed_model": 87, "action_logit": 87, "action_mask": [2, 7, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 70, 71, 80, 86, 87, 90], "action_mask_fn": 90, "action_masking_ag": 86, "action_pars": 86, "action_shap": [94, 97], "action_spac": [2, 3, 4, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 75, 76, 78, 79, 80, 86, 87, 90, 92, 94, 97], "actiondict": 70, "actionmask": 90, "actionmaskag": 86, "actiontyp": [2, 3, 6], "activ": [25, 41, 70, 71, 72, 73, 92], "actor": [9, 12, 54, 68, 71, 72, 73, 75, 76], "actual": [11, 70, 86], "ad": [2, 3, 8, 9, 11, 39, 41, 49, 65, 66, 67, 70, 71, 81], "adam": [12, 71, 75, 76, 94, 97], "adapt": [70, 75, 91], "add": [8, 9, 10, 12, 39, 40, 49, 57, 66, 67, 70, 76, 92, 94], "add_argu": [75, 87, 89, 94], "add_scalar": 75, "add_text": [75, 94], "addit": [3, 4, 8, 11, 19, 20, 35, 37, 41, 45, 48, 49, 51, 65, 70], "addition": [8, 26, 41, 64], "address": 70, "adopt": [43, 44, 45, 46, 47, 48, 49, 50, 51, 52], "adv": 75, "advanc": [31, 47, 77], "advantaeg": [12, 76], "advantag": [12, 75, 76], "adversari": [15, 16, 17, 18, 54, 57, 58, 62, 63], "adversary_0": [56, 58, 62, 63], "adversary_1": [62, 63], "adversary_2": 62, "adversary_3": 63, "aec": [3, 4, 5, 8, 9, 10, 69, 70, 83, 87, 88, 90, 91, 92, 93], "aec_env": 6, "aec_rp": 10, "aec_to_parallel": [6, 70], "aec_to_parallel_wrapp": 6, "aec_wrapper_fn": 70, "aecenv": [4, 6, 10], "affect": [35, 47, 54], "after": [2, 4, 9, 10, 11, 16, 17, 18, 20, 25, 27, 34, 39, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 65, 66, 67, 70, 79, 80, 86, 87, 89, 90, 92, 93], "again": [10, 34, 71], "against": [37, 68, 71, 90, 92], "agent": [2, 3, 6, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 74, 75, 76, 77, 78, 79, 80, 88, 90, 91, 92, 93, 94, 95, 96], "agent1": 10, "agent2": 10, "agent_0": [55, 56, 58, 59, 61, 62, 63], "agent_1": [10, 56, 59, 61, 63], "agent_2": [10, 61], "agent_3": 10, "agent_id": [72, 73, 87, 94], "agent_indicator_v0": [8, 75], "agent_it": [2, 4, 6, 7, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 86, 87, 89, 90, 92, 93], "agent_learn": [94, 97], "agent_mask": [72, 73], "agent_nam": [47, 86], "agent_name_map": 10, "agent_oppon": [94, 97], "agent_ord": 4, "agent_reward": [72, 73], "agent_select": [2, 4, 6, 9, 10, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 79, 80, 90], "agent_selector": 4, "agent_three_count": 71, "agent_warm_up": 71, "agentid": [2, 3, 4, 6, 70], "agentselector": [4, 10], "agilerl": 70, "agilerl_dqn_curriculum": 71, "ai": 43, "aim": [46, 71], "al": [8, 13], "alg_nam": 87, "algo": [12, 71, 72, 73, 75, 76], "algorithm": [2, 8, 12, 68, 71, 72, 73, 74, 75, 76, 77, 87, 88, 89, 91, 96], "alic": 57, "alice_0": 57, "alices_comm": 57, "alien": 30, "all": [2, 3, 4, 6, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 56, 59, 61, 63, 64, 65, 66, 67, 70, 71, 78, 79, 85, 86, 90, 91], "all_ag": 4, "all_environ": 70, "all_landmark_rel_posit": [58, 59, 60], "all_modul": 70, "alli": 66, "alloc": [6, 10, 65, 67], "allow": [1, 2, 3, 4, 5, 7, 8, 9, 10, 11, 13, 22, 25, 47, 49, 52, 54, 70, 71, 72, 73, 74, 77, 79, 80, 90, 91, 92], "alogorithm": [72, 73], "along": [4, 8, 39, 43, 78], "alpha": 71, "alphachesszero": 43, "alphazero": [43, 46], "alreadi": [9, 10, 26, 66, 80], "also": [2, 4, 8, 9, 10, 14, 15, 18, 22, 27, 28, 29, 30, 33, 34, 35, 40, 47, 54, 62, 65, 66, 67, 68, 70, 71, 86, 90], "alter": 71, "altern": [3, 22, 71], "alternating_control": 30, "although": 71, "alwai": [39, 40, 41, 43, 54, 59, 61, 70, 71, 90], "among": [65, 66, 67, 86], "amount": [9, 41, 51], "an": [2, 3, 4, 5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 63, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 79, 80, 85, 86, 88, 90, 91, 92, 93, 96], "analog": [8, 11], "analyt": 70, "ananth": 8, "andrea": 70, "andrewrwilliam": 70, "andrewtanj": 70, "angl": [39, 40, 65], "angle_nois": 65, "angri": 41, "angular": [41, 65], "ani": [2, 4, 6, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 63, 65, 66, 67, 70, 71, 72, 73, 75, 76, 78, 79, 80, 81, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "anneal": [75, 87], "anneal_lr": 75, "annoi": 70, "annot": [92, 93], "announc": 70, "anoth": [8, 9, 47, 48, 51, 54, 81, 90], "ansi": [2, 3, 6, 9, 10, 11, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 65, 66, 67], "answer": 85, "anyon": 83, "anyth": 8, "anywai": 30, "anywher": 66, "apart": 54, "api": [4, 5, 6, 10, 12, 69, 70, 74, 76, 79, 80, 90, 93, 96], "api_test": [2, 11], "apologi": 70, "appear": [20, 41], "append": [8, 9, 47, 71, 72, 73, 86, 89, 90], "append_imag": 89, "appli": [2, 5, 6, 8, 10, 41, 59, 61, 65, 66, 67, 71, 92], "applic": [49, 73, 85, 86, 88], "approach": [13, 43], "appropri": [3, 15, 39, 65], "approx": [12, 75, 76], "approx_kl": [12, 75, 76], "ar": [2, 3, 4, 6, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 70, 71, 72, 73, 75, 76, 78, 79, 80, 83, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "arang": [12, 71, 75, 76], "arbitrari": [2, 43, 44, 45, 46, 47, 48, 50, 51, 52, 70], "arc": 40, "arcad": [8, 13, 34, 68], "arch": [71, 72, 73], "archea": 67, "archer": [2, 4, 38, 70, 91], "archer_0": [40, 92], "archer_1": 40, "architectur": [71, 72, 73], "area": [8, 22, 29, 33, 35, 54, 62, 71, 85], "arg": [4, 65, 66, 67, 70, 75, 87, 89, 94], "argmin": 71, "argpars": [75, 87, 89, 94], "argument": [8, 9, 10, 11, 12, 13, 16, 38, 42, 54, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 94], "argumentpars": [75, 87, 89, 94], "arial": 71, "around": [3, 6, 10, 15, 16, 17, 19, 20, 23, 24, 31, 40, 54, 65, 66, 70, 71, 93], "arrai": [2, 3, 8, 9, 10, 12, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 65, 66, 67, 71, 76, 86], "arrow": [39, 40, 66], "art": [70, 91], "articl": [8, 13, 42, 54], "artifact": 70, "artifici": 13, "arxiv": [8, 13, 42, 54], "as_vector": 47, "ascii": 70, "ask": [71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "aspect": [9, 30, 32, 37], "assert": [6, 11, 70, 75, 90], "assertoutofbound": 70, "assertoutofboundswrapp": [6, 10], "assess": 7, "assign": [8, 71, 72, 73, 90], "assist": 85, "assort": 4, "assum": [81, 90], "assumpt": [6, 90], "astyp": 71, "atari": [8, 9, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 70, 71, 72, 73, 74, 75, 76, 77], "attack": [37, 40], "attempt": [65, 67, 86], "attr": 70, "attribut": [4, 6, 9, 10, 70, 79, 80], "attributeerror": 6, "author": [7, 8, 12, 13, 42, 54, 64, 71, 72, 73, 75, 76, 87, 89, 90, 92, 93, 94, 95, 97], "auto": [27, 68], "auto_rom_install_path": 13, "autobuild": 1, "autodepr": 70, "autom": 70, "automat": [1, 2, 9, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 54, 65, 66, 67, 70, 90], "autonom": [64, 68], "autorom": [13, 75], "avail": [8, 43, 44, 45, 46, 47, 48, 50, 51, 52, 71, 87], "averag": [20, 56, 59, 65, 67, 70, 93], "average_total_reward": 4, "avg": [72, 73, 92, 93], "avg_reward": [92, 93], "avg_reward_per_ag": 92, "aviv": 54, "avoid": [19, 20, 30, 32, 61, 67, 70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "awai": [10, 29, 35, 58], "awar": [24, 37], "award": [44, 45, 47], "awhil": 27, "axelbr": 70, "axi": [12, 71, 76], "b": [1, 8, 43, 71, 72, 75, 89, 92], "b_action": [12, 75, 76], "b_advantag": [12, 75, 76], "b_ind": 75, "b_index": [12, 76], "b_logprob": [12, 75, 76], "b_ob": [12, 75, 76], "b_return": [12, 75, 76], "b_valu": [12, 75, 76], "back": [6, 10, 17, 21, 25, 30, 43, 46, 70], "backend": 75, "backgammon": [7, 70], "backup_polici": 4, "backward": [12, 40, 75, 76], "bad": [27, 70], "badg": 70, "balanc": [41, 46, 49, 71], "ball": [14, 22, 28, 29, 33, 35, 36, 39, 41, 63, 70], "ball_elast": [41, 89], "ball_frict": [41, 89], "ball_mass": [41, 89], "ball_spe": [9, 39], "bamboofungu": 70, "bare": 11, "barrier": 67, "base": [2, 3, 4, 6, 9, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 41, 42, 44, 47, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 67, 68, 69, 70, 71, 72, 86], "base_class": [75, 92, 93], "base_env": 9, "baselin": [4, 8, 13], "baselines3": [70, 90, 92, 93], "basenam": 75, "baseparallelwrap": 70, "baseparallelwrapp": [6, 70], "basepolici": [94, 97], "basewrapp": [6, 90], "basic": [12, 26, 76, 79, 96], "basketbal": [13, 18], "basketball_pong": [14, 70], "basketball_pong_v3": [14, 28], "batch": [12, 71, 72, 73, 75, 76, 91, 94, 97], "batch_index": [12, 76], "batch_ob": 87, "batch_siz": [12, 71, 72, 73, 75, 76, 92, 93, 94, 97], "batched_act": 87, "batchifi": [12, 76], "batchify_ob": [12, 76], "battl": [21, 22, 29, 35, 37], "battlefield": 70, "beat": [49, 71], "becaus": [9, 10, 18, 20, 27, 47, 86, 90], "becom": [8, 9, 71], "been": [8, 9, 13, 26, 30, 43, 44, 47, 52, 66, 67, 70, 75, 90, 92, 93], "befor": [2, 4, 6, 8, 9, 10, 26, 27, 40, 42, 43, 70, 71, 78], "before_sleep": 86, "begin": [2, 18, 47, 48, 51, 57], "beginn": 70, "behav": 90, "behavior": [2, 6, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 41, 70], "behind": 32, "being": [8, 9, 16, 35, 40, 47, 49, 54, 62, 63, 66, 67, 70, 80], "bellemar": 13, "bellemare13arcad": 13, "belong": [29, 67], "below": [6, 10, 11, 13, 24, 25, 41, 43, 44, 45, 46, 47, 48, 50, 51, 52, 65, 71, 72, 73, 75, 76, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "benchmark": [64, 74, 77], "benefit": 37, "benjamin": [8, 13], "bertranddecost": 70, "best": [48, 71, 81], "best_act": 71, "best_fit": 71, "bet": [48, 51], "beta": [71, 85], "better": [8, 70, 71, 90], "between": [2, 3, 5, 6, 8, 10, 22, 23, 27, 30, 37, 40, 41, 54, 70, 71, 85, 86, 90, 96], "betwenen": 95, "beyond": [54, 65, 67, 85], "bi": 16, "bia": [12, 73, 75, 76], "bias": [71, 75, 77], "bias_const": [12, 75, 76], "biggest": 8, "billiard": 17, "billiard_hit": 17, "bin": 13, "binari": [42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 70], "biped": 65, "bird": 41, "bishop": 43, "bit": [13, 47, 57], "bitter": 71, "bkrl": 70, "black": [8, 13, 40, 43, 46, 62, 67, 70, 92], "black_0": 46, "black_death": 92, "black_death_v2": 8, "black_death_v3": 92, "blank": [71, 92], "blast": 17, "blizzard": 68, "blob": 75, "block": [26, 54, 62, 71, 72, 73, 80], "block_vert_coef": 71, "blockad": 26, "blog": [12, 75, 76, 91], "blue": [47, 63, 66], "board": [7, 22, 27, 43, 46, 52, 68, 70, 71, 80, 90], "board_histori": 43, "board_siz": [46, 90], "board_valu": 71, "boast": 96, "bob": [54, 57], "bob_0": 57, "bodi": 40, "bolundai0216": 70, "bomb": [21, 30], "bomberman": 68, "bonu": [25, 30], "booktitl": 64, "bool": [2, 3, 4, 45, 47, 71, 75], "boolean": 50, "bootstrap": [12, 75, 76], "border": [40, 41, 54], "bot": 68, "both": [4, 5, 6, 8, 10, 20, 21, 23, 25, 27, 32, 37, 41, 43, 44, 45, 46, 47, 49, 51, 52, 54, 57, 59, 67, 70, 74, 79, 83, 91], "both_dir": 71, "bottom": [40, 44, 54, 79, 81], "bounc": [17, 41], "bounce_random": [9, 39], "bound": [6, 8, 39, 62, 63], "bowl": 13, "box": [2, 8, 13, 55, 56, 57, 58, 59, 60, 61, 62, 63, 66, 87], "boxing_v2": 15, "bracket": 70, "break": [2, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 40, 70, 71, 72, 73, 75, 76, 90, 92, 93], "breakdown": 40, "bro": 13, "broadcast": 54, "broken": 70, "brought": 70, "buffer": [71, 72, 73, 94], "buffer_s": 94, "buffer_warm_up": 71, "bug": [2, 11, 39, 40, 43, 44, 45, 46, 47, 48, 50, 51, 52, 64, 65, 66, 67, 70], "bugfix": 70, "buggi": 70, "build": 96, "built": 81, "bullet": [16, 17, 31, 37, 68], "bump": [40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 70, 80], "bunch": 70, "butterfli": [3, 4, 6, 9, 10, 11, 12, 39, 40, 41, 69, 70, 75, 76, 87, 89, 92], "button": 34, "c": [13, 43, 70, 71, 72, 73], "cach": [10, 11, 70, 79, 80], "cake": 39, "cake_paddl": [9, 39], "calcul": [4, 12, 47, 70, 71, 75, 76], "call": [2, 4, 6, 8, 9, 10, 11, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70, 79, 80, 85, 90], "callabl": 97, "callback": [94, 97], "can": [1, 2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 57, 60, 61, 63, 64, 65, 66, 67, 68, 69, 70, 75, 79, 80, 81, 85, 86, 90, 91, 92, 93, 94, 97], "cannot": [2, 3, 4, 9, 14, 27, 40, 44, 47, 54, 57, 60, 68, 70], "cao": 42, "cap": 65, "capabililti": 70, "capabl": [43, 69], "captur": [6, 13, 26, 27, 34, 43, 46, 67, 75], "capture_stdout": 4, "capture_video": 75, "capturestdoutwrapp": [4, 6, 10], "card": [42, 45, 47, 48, 50, 51, 68], "card_knowledg": 47, "cardin": [54, 79], "care": [24, 26, 37], "carefulli": 10, "carla": 70, "carri": 65, "cartesian": [59, 63], "case": [2, 6, 9, 65, 70, 78], "cast": [70, 90], "castl": 43, "catch": [66, 70, 79], "catch_reward": 66, "categor": [12, 75, 76], "cathedr": 70, "caught": [2, 66], "caus": [2, 65, 70, 90], "cd": 1, "cell": [44, 52, 80], "center": [39, 40, 66], "central": [3, 39, 65, 72], "certain": [8, 9, 54, 70, 71, 80], "cff": 70, "challeng": [38, 39, 68], "champion": 71, "chanc": [2, 8], "chang": [1, 2, 3, 4, 6, 9, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 46, 47, 65, 66, 67, 70, 71, 75, 79, 80, 87, 90], "changeabl": 9, "changelog": 70, "channel": [8, 12, 43, 54, 57, 66, 70, 71, 72, 73, 76, 92], "channel_s": [71, 72], "channels_last": [72, 73], "chart": 75, "chase": 63, "chat_model": 86, "chatopenai": 86, "check": [4, 6, 11, 21, 43, 48, 50, 51, 57, 70, 71, 72, 73, 74, 75, 79, 80], "check_for_winn": 70, "check_three_in_row": 71, "check_vertical_win": 71, "check_winn": 71, "checker": [13, 70], "checkpoint": [71, 87, 89], "checkpoint_000050": [87, 89], "checkpoint_freq": [87, 89], "checkpoint_path": [87, 89], "chess": [1, 2, 7, 42, 68, 70, 71, 80, 88, 90], "chess_v5": 70, "chess_v6": [2, 43, 70, 90], "chicken": 68, "chines": 46, "chip": [48, 50, 51], "chipmunk": 41, "choic": [18, 49, 71, 94], "choos": [2, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 49, 54, 67, 71, 85], "chosen": [4, 8, 65, 86], "chrisyeh96": 70, "ci": [70, 87, 89, 90], "cibeah": 70, "circl": [54, 62], "circular": 54, "circumst": 9, "citat": 70, "cite": [7, 8, 42, 45, 48, 51, 54, 64], "cl": 86, "clamp": [12, 75, 76, 87], "class": [2, 3, 4, 6, 8, 10, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 71, 75, 76, 78, 79, 80, 86, 87, 89, 90], "classic": [1, 2, 3, 6, 17, 27, 28, 30, 34, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 68, 70, 71, 72, 73, 86, 87, 89, 94, 95, 97], "classmethod": 86, "clean": [12, 54, 70, 76, 91], "cleanrl": [12, 70, 94, 97], "cleanup": [40, 70], "clear": [30, 37, 70], "cli": [70, 75, 77, 96], "clip": [6, 8, 12, 75, 76], "clip_act": 89, "clip_actions_v0": 8, "clip_coef": [12, 75, 76], "clip_frac": [12, 76], "clip_grad_norm_": 75, "clip_param": 89, "clip_reward_v0": [8, 72, 75], "clip_vloss": 75, "clipfrac": 75, "clipoutofboundswrapp": [6, 10], "clock": [10, 43, 79, 80], "clockwis": 40, "clone": [71, 75], "close": [2, 3, 6, 7, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 70, 71, 72, 73, 75, 86, 89, 90, 92, 93], "closer": [2, 59], "closest": [56, 61], "club": [45, 50, 51], "cnn": [71, 72, 91, 92, 93], "cnnmodelv2": 89, "cnnpolici": 92, "co": [70, 74], "code": [1, 2, 6, 9, 10, 12, 40, 54, 64, 65, 70, 91, 96], "codebas": 54, "codeblock": 70, "coef": 75, "coeffici": [71, 75], "coin": 25, "col": 71, "collabor": 25, "collect": [8, 10, 12, 25, 66, 71, 72, 73, 76, 85, 86, 94, 95, 97], "collector": [94, 95, 97], "collid": [40, 61, 67], "collis": [39, 61, 62, 63, 65, 70], "color": [5, 8, 27, 43, 47, 54, 56, 59, 71, 92], "color_reduction_v0": [8, 12, 72, 75, 76, 89, 92], "column": [41, 43, 44, 45, 70, 71], "column_count": 71, "column_piec": 71, "com": [7, 12, 64, 70, 71, 72, 73, 75, 76, 87, 89, 90, 92, 93, 94, 95, 97], "combat": [13, 31], "combat_jet_v1": 16, "combat_plan": 16, "combat_plane_v2": 16, "combat_tank": 17, "combat_tank_v2": 17, "combat_tank_v3": 17, "combin": [6, 18, 41, 43, 45, 54, 70], "combined_arm": 70, "come": [8, 32], "comm": 54, "command": 1, "comment": [10, 70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "commit": 70, "common": [4, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 47, 49, 70, 75, 85, 90, 94, 97], "commonli": [5, 7, 9], "commun": [42, 47, 48, 50, 51, 54, 57, 59, 60, 61, 63], "companion": [8, 10], "compar": [64, 73, 74], "comparison": [3, 70], "compass": 43, "compat": [5, 13, 47, 68, 70, 90], "compens": 46, "compet": [7, 71], "competit": [7, 13, 14, 23, 26, 28, 30, 31, 32, 33, 37, 42, 54, 67, 71, 72, 74], "complet": [11, 47, 66, 70, 81, 94], "complex": [10, 16, 47, 68, 72, 85], "compli": 70, "complianc": 11, "complic": [71, 78], "compon": [71, 72, 73], "compos": [54, 65, 85], "composit": 54, "comprehens": 96, "compris": 13, "comput": [2, 9, 12, 13, 39, 40, 45, 46, 67, 71, 76, 87, 90], "computation": 8, "compute_actions_from_input_dict": 87, "compute_single_act": 89, "concat_vec_envs_v1": [75, 92, 93], "concaten": [8, 71], "concatvecenv": 70, "concept": [71, 78], "condit": [2, 9, 47, 70, 71, 79, 80], "confer": 64, "config": [70, 75, 87, 89], "configur": [9, 38, 47, 71, 72, 73], "confin": 68, "conflict": [68, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "confus": [26, 70], "connect": [2, 10, 39, 40, 41, 42, 43, 46, 47, 49, 52, 65, 66, 67, 70, 74, 88, 91], "connect_four": [44, 71, 90], "connect_four_": 71, "connect_four_v3": [42, 44, 71, 90], "consequ": 91, "conserv": 32, "consid": [2, 9, 41, 66, 71], "consider": 71, "consist": [11, 43, 54, 70, 79], "consol": [8, 13, 47], "const": 75, "constant": [8, 10, 11, 40, 79, 80, 92], "constant_": [12, 75, 76], "constantli": [19, 20], "constraint_window": 66, "construct": [47, 95], "constructor": [9, 87], "consum": 67, "cont_act": [72, 73], "contact": 65, "contain": [1, 9, 10, 43, 44, 45, 46, 47, 48, 50, 51, 52, 54, 65, 70, 71, 86], "content": [70, 71, 86], "continu": [6, 8, 12, 32, 41, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 67, 70, 71, 72, 73, 76, 78, 89], "continuous_act": [54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 73], "contrast": 2, "contrib": 90, "contribut": [1, 41, 68, 70], "contributor": 70, "control": [2, 8, 9, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 67, 70, 78, 91], "conv2d": [12, 75, 76, 89], "convei": 57, "conveni": [5, 6, 10, 43], "converg": 72, "convers": [5, 68, 70, 79, 80], "convert": [2, 3, 5, 6, 8, 10, 12, 70, 76, 90, 95], "convolut": [43, 72], "cook": 68, "cooper": [7, 8, 13, 30, 37, 38, 41, 47, 54, 64, 67, 70, 72, 93], "cooperative_pong": 39, "cooperative_pong_v5": [9, 39], "coordin": [20, 22, 29, 35, 38, 41, 43, 46, 63, 66, 67, 79, 80], "copi": [71, 79, 80, 94], "core": 70, "corner": [40, 46, 79], "correct": [11, 60, 70], "correctli": [2, 3], "correspond": [2, 8, 9, 10, 26, 40, 43, 44, 48, 52, 67], "costa": 75, "could": [2, 3, 9, 47, 51, 71], "count": [10, 17, 43, 45, 66, 71], "counter": [40, 71, 72, 73], "coupl": 13, "cours": 9, "court": 14, "cover": [56, 61], "cpu": [12, 71, 72, 73, 75, 76, 90, 92, 94, 97], "craft": 71, "crash": [11, 40], "craze": 13, "crazyfli": 68, "creat": [2, 3, 4, 6, 9, 10, 11, 26, 38, 47, 64, 67, 69, 70, 71, 72, 73, 75, 76, 78, 79, 83, 85, 87, 89, 90, 91, 92, 93, 94, 95, 97], "creation": [9, 70, 83], "criteria": 71, "critic": [12, 41, 54, 70, 72, 73, 75, 76], "crop": 8, "crt": 8, "crypto": 54, "cuda": [12, 71, 72, 73, 75, 76, 94, 97], "cudnn": 75, "cumul": [8, 9], "current": [2, 3, 4, 6, 8, 9, 10, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 68, 70, 79, 80, 86, 90], "current_ag": 90, "curriculum": [70, 74], "curriculumenv": 71, "cursor": [27, 34], "custom": [2, 3, 4, 69, 70, 78, 79, 80, 81, 90], "custom_environ": [78, 79, 80, 81], "custom_environment_v0": [78, 79, 80], "custom_model": 87, "custom_test": 11, "customactionmaskedenviron": [80, 81], "customenviron": [78, 79, 81], "cycl": [2, 3, 4, 6, 9, 10, 40, 54, 66, 70, 79, 80], "cyclic": 10, "d": [40, 41, 43, 68, 71, 90, 92, 93], "d0": 71, "d1": 71, "danger": [19, 20], "daochen": 42, "data": [4, 10, 12, 47, 65, 70, 75, 76, 94, 95, 97], "databas": 86, "date": 10, "datetim": 71, "ddpg": 72, "dead": [8, 10, 19, 20, 45, 70, 92], "deadwood": 45, "deadwood_count": 45, "deal": 13, "death": [8, 19, 20, 24, 25, 26, 36, 37, 40, 65, 70, 92], "debug": [10, 11, 55, 87, 89], "decai": [71, 72, 73], "deceiv": 56, "decent": 90, "decentr": [3, 39, 65, 72], "decept": 7, "decid": [46, 71], "decis": [71, 85], "deck": [45, 47, 48, 51], "declar": [1, 10, 45], "deep": [8, 64, 71, 72, 73, 74, 87, 94, 96, 97], "deepcopi": [71, 94], "deepmind": [2, 68, 71], "def": [10, 12, 62, 71, 72, 73, 75, 76, 78, 79, 80, 86, 87, 89, 90, 92, 93, 94, 97], "default": [2, 3, 4, 8, 9, 10, 13, 39, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 59, 60, 61, 62, 63, 65, 66, 67, 70, 71, 72, 73, 75, 90, 94], "default_output_kei": 86, "defeat": 49, "defend": [22, 29, 36], "defens": 23, "defin": [8, 10, 11, 45, 46, 47, 71, 72, 73, 79, 80, 86, 90, 95], "definit": [2, 70, 71], "degre": 38, "delai": [8, 73], "delay_observations_v0": 8, "delet": [70, 71], "deliber": 71, "delta": [12, 75, 76], "demo": [68, 70, 71, 72, 73, 90, 92, 93], "demonstr": [70, 71, 86, 91, 95], "dendrit": 67, "dep": 70, "depend": [2, 9, 13, 18, 30, 37, 38, 42, 46, 47, 54, 64, 65, 67, 70, 71, 72, 73, 75, 76, 78, 86, 87, 89, 90, 92, 93, 94, 95, 97], "dependabot": 70, "depict": [50, 66, 67], "deploy": 78, "deprec": [4, 70, 79, 80], "deprecated_modul": 10, "deprecatedenv": 10, "deprecatedmodul": 10, "depreci": [68, 78], "depric": 70, "dequ": [71, 86], "deriv": 68, "describ": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 43, 44, 45, 46, 47, 48, 50, 51, 52, 54, 63, 66, 78], "descript": [45, 46, 47, 48, 50, 51, 65, 67, 68, 87, 89], "design": [2, 10, 12, 20, 68, 71, 72, 73, 75, 76, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "desir": [4, 71], "despit": 13, "destin": 54, "destroi": 67, "detail": [3, 45, 48, 51, 54, 91], "detect": [2, 11, 67, 90], "determin": [11, 13, 49, 71, 72, 73, 90], "determinist": [8, 11, 13, 72, 73, 75, 90, 92, 93], "dev": 75, "develop": [2, 3, 13, 68, 70, 85], "devic": [12, 71, 72, 73, 75, 76, 94, 97], "di": [9, 19], "diagon": [27, 43, 44, 52, 71], "diagram": 70, "diamond": [45, 50, 51], "dict": [2, 3, 9, 10, 39, 40, 41, 43, 44, 46, 47, 49, 52, 65, 66, 67, 70, 71, 92, 94, 97], "dictat": 70, "dictionari": [3, 9, 10, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 70, 72, 73], "did": 90, "die": [8, 9, 40, 92], "differ": [2, 3, 6, 11, 24, 27, 42, 45, 47, 49, 54, 58, 59, 66, 71, 85, 86], "difficult": [2, 18, 30, 68, 71, 90], "difficulti": 71, "dilemma": 7, "dim": 71, "dimens": [71, 72, 73], "dimension": [43, 90, 92, 93], "direct": [16, 21, 39, 40, 41, 43, 54, 67, 70, 71, 79], "directli": [2, 9, 23, 33, 41, 47, 64, 91], "directori": [4, 10, 70, 81], "dirhtml": 1, "dirnam": 71, "disabl": [10, 11, 70, 79, 80, 90], "disadvantag": 46, "disallow": 6, "disappear": 26, "discard": [45, 47], "discord": [68, 70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "discount": [71, 72, 73, 75], "discount_factor": 97, "discourag": 64, "discov": 71, "discret": [2, 8, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 66, 70, 71, 72, 73, 75, 79, 80, 87, 90, 91, 93], "discrete_act": [71, 72, 73], "discuss": 71, "disk": [90, 92, 93], "displai": [2, 3, 10, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 54, 65, 66, 67], "distanc": [21, 40, 54, 55, 56, 58, 59, 61, 63, 67], "distribut": [2, 12, 65, 66, 67, 75, 76, 88], "distutil": 75, "diverg": 75, "divid": [20, 41, 90], "dm_control": 7, "dm_control_multiagent_compat": 7, "dm_soccer": 7, "dmcontrolmultiagentcompatibilityv0": 7, "dmytroivasiuk": 70, "do": [6, 8, 9, 11, 13, 40, 44, 54, 67, 68, 71, 75, 85, 86, 90, 91], "doc": [10, 70, 75, 78, 86], "docstr": 70, "doctest": 70, "document": [2, 3, 4, 7, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 45, 48, 51, 54, 56, 65, 70, 71, 72, 73, 74, 75, 77, 78, 79, 80, 83, 86, 87, 88, 89, 90, 92, 93, 96], "doe": [2, 4, 6, 8, 9, 11, 14, 18, 22, 27, 28, 29, 33, 34, 35, 47, 86, 90, 91, 92], "doesn": [56, 70, 90], "domain": [70, 73], "don": [8, 33, 62, 90], "done": [12, 25, 26, 36, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70, 71, 72, 73, 75, 76, 85, 95], "door": 79, "doubl": [13, 71], "double_dunk": 18, "double_dunk_v3": 18, "doudizhu": 70, "down": [8, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 66, 67, 71, 79, 80], "downleft": [15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 31, 33, 37], "downright": [15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 31, 33, 37], "downscal": 13, "downstream": 9, "dqn": [70, 74, 88, 94, 96, 97], "dqn_torch_model": 87, "dqnagent": 87, "dqnconfig": 87, "dqnpolici": [94, 97], "dqntorchmodel": 87, "draft": 90, "draw": [43, 44, 45, 49, 52, 71, 72, 73], "drawer": [71, 72, 73], "drawn": 47, "drive": 68, "drop": [44, 47, 70], "dsctt": 70, "dtype": [8, 10, 71, 80, 86], "dtype_v0": [8, 89], "due": [8, 11, 13, 41, 43, 44, 46, 47, 49, 52, 68, 70], "duel": 87, "duke": 15, "dummi": [32, 79, 80, 87, 89], "dummyvectorenv": [94, 95, 97], "dunk": 13, "duplic": [13, 70], "durat": [65, 71, 72, 73, 89], "dure": [4, 9, 11, 70, 94], "dylwil3": 70, "dynam": [2, 4, 67], "dynamic_resc": [55, 56, 57, 58, 59, 60, 61, 62, 63], "e": [1, 2, 3, 6, 8, 9, 30, 40, 41, 43, 54, 65, 70, 71, 79, 80, 81, 86], "each": [2, 3, 9, 10, 12, 13, 15, 18, 20, 22, 25, 26, 27, 29, 30, 35, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70, 71, 72, 73, 75, 76, 78, 79, 80, 90, 92, 93, 95], "earlier": [71, 90, 94], "earn": [24, 25], "easi": [4, 6, 10, 71, 92], "easier": [47, 70, 75], "easili": [19, 20, 71, 90], "easy_env": 90, "edg": [39, 40, 43, 65], "effect": [20, 21, 80], "effici": 6, "efg": [2, 70], "egorov": 64, "eight": 43, "either": [2, 4, 14, 21, 22, 25, 28, 35, 39, 40, 41, 44, 46, 47, 49, 52, 70], "elast": [39, 41], "elect": 71, "element": [8, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 65, 67, 70], "elif": [2, 38, 71, 79, 80], "elit": [71, 72, 73], "elite_opp": 71, "elliot": [7, 75, 90, 92, 93], "elliottow": [70, 75, 90, 92, 93], "els": [2, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 71, 72, 73, 74, 75, 76, 86, 87, 89, 90, 92, 93, 94, 97], "elsewher": 10, "em": [70, 86, 87], "embed": 87, "emerg": [38, 41, 54], "emit": 6, "empti": [9, 10, 44, 46, 70], "en": [43, 70, 90, 92, 93], "enabl": [8, 26, 40, 67, 70, 71, 72, 73, 75, 90], "encod": [8, 43, 46, 47, 48, 49, 52], "encounter_reward": 67, "encourag": [9, 11, 13, 70, 71], "encrypt": 57, "end": [2, 3, 6, 12, 13, 15, 19, 20, 30, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 67, 70, 71, 75, 76, 85, 90], "end_dim": [12, 76], "end_step": [12, 76], "enemi": 24, "enforc": [6, 70], "engin": [41, 68, 70, 71, 91, 96], "enh": 70, "enhanc": 72, "enough": [2, 11], "ensur": [1, 9, 45, 70, 71], "ent": 75, "ent_coef": [12, 75, 76], "entir": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 45, 70], "entireti": 78, "entiti": [40, 67, 75], "entomb": [13, 19, 20], "entombed_competit": 19, "entombed_competitive_v3": 19, "entombed_coop": [20, 70], "entombed_cooperative_v3": 20, "entri": [9, 10, 48, 50, 51], "entropi": [12, 75, 76], "entropy_coeff": 89, "entropy_loss": [12, 75, 76], "enumer": [12, 65, 67, 71, 75, 76], "env": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 75, 76, 78, 79, 80, 81, 86, 87, 88, 89, 90, 92, 93, 94, 95, 97], "env_creat": [87, 89], "env_defined_act": [72, 73], "env_don": 70, "env_fn": [11, 90, 92, 93], "env_func": 11, "env_id": 75, "env_kwarg": [90, 92, 93], "env_logg": 4, "env_max": [8, 89], "env_min": [8, 89], "env_nam": [87, 89], "env_reward": 71, "env_step": [94, 97], "env_trunc": 10, "environ": [2, 3, 4, 5, 6, 8, 12, 38, 39, 40, 41, 42, 43, 44, 45, 46, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 74, 77, 78, 80, 85, 91], "environment_paramet": 9, "environmentcr": 70, "ep": [12, 71, 72, 73, 75, 76, 94], "episod": [4, 12, 40, 57, 70, 71, 72, 73, 74, 75, 76, 95], "episode_num": [71, 72, 73], "episode_per_test": 97, "episodes_per_epoch": 71, "episodic_length": 75, "episodic_return": 75, "epoch": [71, 75, 94, 97], "eps_decai": [71, 72, 73], "eps_end": [71, 72, 73], "eps_test": 94, "eps_train": 94, "epsilon": [71, 72, 73, 87], "epsilon_timestep": 87, "epsilongreedi": 87, "equal": [42, 45, 47, 65, 71], "equival": [2, 3, 6, 8, 9], "erik": 13, "error": [2, 4, 6, 9, 10, 11, 47, 70, 71, 87, 89], "error_agent_iter_before_reset": 4, "error_nan_act": 4, "error_observe_before_reset": 4, "error_possible_agents_attribute_miss": 4, "error_render_before_reset": 4, "error_state_before_reset": 4, "error_step_before_reset": 4, "escap": [19, 20, 79, 80], "escape_i": [79, 80], "escape_x": [79, 80], "especi": [8, 70], "essenti": [24, 37], "establish": 4, "estim": 75, "estimation_step": 97, "et": [8, 13], "etc": [8, 10, 11, 70, 86], "euclidean": [55, 56, 67], "ev": [54, 57], "evad": 66, "evader_spe": 67, "eval": [12, 71, 76, 92, 93, 94], "eval_action_mask": 90, "eval_actions_dict": 71, "eval_actions_hist": 71, "eval_oppon": 71, "eval_turn": 71, "evalu": [4, 8, 11, 13, 70, 71, 72, 73], "eve_0": 57, "even": [2, 10, 13, 90], "evenli": 67, "eventu": 30, "everi": [1, 2, 3, 6, 9, 13, 41, 63, 66, 67, 70, 71, 93, 95], "everyon": 70, "everyth": [13, 40, 71], "evo": 71, "evo_epoch": [71, 72, 73], "evo_loop": [71, 72, 73], "evo_step": [71, 72, 73], "evohpo": 71, "evolut": [71, 72, 73], "evolutionari": [71, 72, 73, 74], "evolv": [2, 71, 72, 73], "exact": 54, "exactli": 49, "exampl": [1, 4, 6, 11, 13, 43, 45, 46, 47, 49, 67, 70, 71, 75, 79, 80, 83, 85, 86, 87, 90, 91, 92, 94, 95, 97], "exce": 67, "exceed": 70, "exceedingli": [12, 76], "except": [3, 6, 8, 9, 13, 43, 44, 45, 46, 47, 48, 50, 51, 52, 60, 63, 72, 73, 86, 90, 92, 93], "excit": [70, 71], "exclud": 45, "exclus": 2, "execut": [1, 2, 3, 8, 9, 12, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 54, 65, 66, 67, 75, 76, 79, 80, 91, 95], "exert": 65, "exist": [6, 8, 11, 40, 44, 47, 70], "exist_ok": [71, 72, 73, 97], "exit": [26, 33, 62, 87, 89, 90, 92, 93], "exp": [12, 62, 75, 76], "exp_nam": 75, "expand": 70, "expand_dim": [71, 72, 73, 87], "expandus": [87, 89], "expans": [49, 70], "expect": [24, 90, 94], "experi": [71, 72, 73, 75, 77], "experiment": 40, "explain": [12, 76], "explained_var": [12, 75, 76], "explained_vari": 75, "explicitli": [2, 47], "exploit": 71, "explor": [20, 71, 72, 73, 87], "exploration_config": 87, "exploration_nois": [94, 97], "express": 43, "extend": [2, 72, 73, 86, 94], "extens": [2, 13, 71], "extern": [4, 5, 7, 70, 85], "extra": [49, 70], "extract": 87, "extractor": [90, 92, 93], "ezpickl": 70, "f": [12, 40, 43, 71, 72, 73, 75, 76, 79, 80, 86, 90, 92, 93, 94, 97], "f1tenth": 68, "f841": 86, "face": 70, "facilit": 43, "fact": [8, 17], "factor": [9, 41, 65, 67, 71, 72, 73, 75], "fail": [11, 65, 70], "fairli": 27, "fall": [36, 44, 65], "fall_reward": 65, "fallen": 65, "fals": [4, 8, 9, 10, 11, 12, 13, 17, 30, 39, 40, 41, 45, 47, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 86, 87, 92, 94, 97], "famili": 9, "familiar": [7, 18], "fan": 18, "fantast": 9, "far": [20, 47, 58, 61, 86], "farama": [7, 10, 13, 38, 68, 70, 79, 80, 90], "fast": [71, 96], "fast_bomb": 30, "faster": [8, 13, 16, 30, 62, 70, 74], "fastrand": [71, 72, 73], "favicon": 70, "favor": [70, 94], "fcnet": 87, "feat": 71, "featur": [9, 11, 43, 47, 54, 67, 70, 77, 90, 92, 93], "feel": [71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "fernadoo": 70, "fetch": 85, "few": [8, 10, 13, 18, 42, 68, 91], "ffelten": 70, "field": [17, 71], "field_nam": [71, 72, 73], "fig1": [71, 74], "file": [1, 4, 12, 70, 76, 77, 81, 94], "filenam": [72, 73], "filipinogambino": 70, "fill": [8, 32, 44, 71, 72, 73], "fill_replay_buff": 71, "final": [40, 43, 47, 49, 71, 72, 73, 90, 94], "final_epsilon": 87, "find": [10, 19, 20, 43, 71], "fine": 90, "finish": [70, 71, 90, 92, 93], "finit": 8, "fire": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 40], "firebal": 25, "firework": 47, "first": [2, 4, 6, 8, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70, 71, 72, 73, 78, 85, 91], "first_0": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37], "fit": [6, 71, 72, 73], "fix": [16, 19, 20, 24, 25, 26, 27, 29, 34, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 50, 51, 52, 54, 64, 65, 66, 67, 70, 75], "flag": [13, 65, 86], "flag_captur": 21, "flag_capture_v2": 21, "flake8": [70, 75], "flash": [8, 70], "flatten": [8, 12, 43, 71, 75, 76, 89], "flatten_v0": 8, "flexibl": [2, 68], "fli": 30, "flicker": 13, "flight": 16, "flip": [25, 27, 71], "float": [2, 3, 4, 6, 12, 45, 46, 67, 71, 75, 76, 94], "float16": 8, "float32": [8, 86, 89], "float64": 8, "float_max": 87, "floor": [25, 35], "flush": 4, "fly": 16, "fmt": 75, "focus": [71, 74], "fold": [43, 48, 50, 51, 70], "folder": [1, 4, 70, 75], "follow": [1, 2, 3, 5, 6, 8, 9, 10, 13, 27, 43, 46, 47, 48, 49, 50, 51, 52, 54, 62, 68, 70, 71, 72, 73, 74, 75, 76, 78, 79, 80, 86, 87, 89, 90, 92, 93, 94, 95, 97], "font": 71, "food": [63, 67], "food_reward": 67, "footbal": 68, "foozbal": 22, "foozpong": [13, 70], "foozpong_v3": 22, "forc": [32, 65], "forest": 63, "forev": [30, 67, 70], "form": [2, 40, 47, 54, 66, 67, 70], "formal": 2, "format": [10, 70, 71, 86, 95], "forth": [10, 30], "fortress": 36, "forward": [40, 80, 87, 89], "forward_reward": 65, "found": [1, 11, 43, 44, 45, 46, 47, 48, 50, 51, 52, 71, 75, 90, 92, 93], "foundat": [7, 13, 68, 70], "four": [13, 22, 29, 35, 36, 40, 42, 54, 70, 74, 78, 79, 88, 91], "fourth_0": [22, 29, 35, 36], "fp": [8, 70], "frac": 75, "fraction": [12, 71, 76], "frame": [3, 5, 8, 9, 13, 18, 34, 43, 46, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 67, 70, 71, 72, 73, 74, 91, 92, 95], "frame_list": 89, "frame_no": 71, "frame_s": [12, 76], "frame_skip": [8, 13], "frame_skip_v0": [8, 13, 72, 75], "frame_stack_v1": [8, 12, 13, 72, 75, 76, 89, 92], "frames_per_second": 70, "frameskip": 8, "framework": [74, 85, 87, 89, 96], "free": [71, 72, 73, 75, 76, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "freeze_evad": 66, "freq": [71, 94], "frequenc": [71, 72, 73], "frequent": 2, "frequneci": 73, "friction": 41, "friendli": [70, 77], "from": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 75, 76, 77, 78, 79, 80, 81, 83, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "from_checkpoint": [87, 89], "from_parallel": [10, 70], "fromarrai": [71, 72, 73, 89], "front": [23, 40, 65, 80], "full": [8, 10, 13, 44, 47, 51, 66, 67, 70, 75, 79, 83, 92, 94, 96], "full_action_spac": 13, "full_column": 71, "fulli": [8, 66, 70], "fullyconnectednetwork": 87, "fun": 79, "function": [2, 4, 5, 6, 9, 10, 11, 39, 40, 41, 43, 44, 45, 46, 47, 49, 52, 62, 63, 65, 66, 67, 68, 70, 71, 72, 73, 75, 78, 86, 87, 90, 94, 97], "functool": [10, 79, 80], "further": [71, 72, 73], "futur": 47, "g": [2, 3, 8, 13, 43, 54, 70, 71, 79, 80, 81], "g1": 43, "gae": 75, "gae_lambda": 75, "gain": 25, "game": [2, 3, 4, 6, 7, 8, 9, 10, 11, 14, 15, 16, 17, 18, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 70, 71, 74, 75, 79, 80, 86, 90, 91, 92, 93, 95, 96], "game_nam": 7, "game_vers": [16, 26, 28], "gamma": [12, 71, 72, 73, 75, 76, 89, 94], "gather": 70, "gen_envs_md": 1, "gener": [1, 2, 3, 7, 8, 9, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 69, 70, 75, 80, 86], "generated_ag": [2, 70], "get": [4, 9, 10, 12, 14, 17, 19, 20, 21, 22, 23, 27, 28, 29, 33, 35, 37, 38, 41, 43, 45, 51, 55, 59, 70, 71, 72, 73, 76, 79, 80, 87, 89, 90, 92, 93, 94], "get_action_and_valu": [12, 75, 76], "get_ag": 94, "get_arg": 94, "get_doc": 86, "get_env": 94, "get_logg": 4, "get_pars": 94, "get_polici": 87, "get_valu": [12, 75, 76], "getact": [71, 72, 73], "getctim": [90, 92, 93], "getcwd": 4, "getmodul": 86, "getvalu": 4, "gg": 70, "gif": [70, 71, 72, 73, 89], "gif_path": [71, 72, 73], "gin": [42, 70], "gin_reward": 45, "gin_rummi": 45, "gin_rummy_v4": [45, 90], "git": [94, 95, 97], "github": [7, 12, 64, 70, 71, 72, 73, 74, 75, 76, 78, 87, 89, 90, 91, 92, 93, 94, 95, 97], "gitlab": 70, "give": [6, 10, 11, 14, 21, 22, 28, 29, 35, 41, 42, 47, 59, 63, 65, 70, 86, 91], "given": [2, 4, 6, 8, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 41, 42, 46, 47, 49, 86], "glitch": 39, "glob": [90, 92, 93], "global": [3, 9, 39, 40, 41, 59, 61, 65, 67], "global_reward": 41, "global_step": [71, 75], "go": [1, 42, 45, 70, 71, 80, 85, 90], "go_v5": [46, 90], "goal": [22, 25, 27, 32, 33, 41, 54, 86], "goal_id": [59, 60], "goal_landmark_id": 58, "goal_rel_posit": [56, 58], "gobblet": 70, "goe": [39, 45, 65], "good": [11, 17, 54, 56, 57, 58, 62, 63, 70], "googl": [68, 70], "gpu": [90, 93], "grad": 75, "grad_clip": 89, "grade": 88, "gradient": [2, 72, 73, 75], "gradio": 68, "grai": 60, "grand": 71, "graph": 2, "graphic": [8, 10, 11], "grayscal": 13, "grayscale_imag": 13, "greater": [49, 51], "greater_equ": 71, "greedi": 27, "greedili": 27, "green": [47, 54, 56, 62, 67], "greyscal": 8, "grf": 68, "grid": [40, 44, 52, 66, 68, 79, 80], "gridworld": 3, "ground": [54, 65], "grow": 54, "gt": 70, "gtp": 46, "guarante": 68, "guard": [79, 80], "guard_act": [79, 80], "guard_action_mask": 80, "guard_i": [79, 80], "guard_x": [79, 80], "gui": 70, "guid": [10, 70, 71, 74, 78], "guided_missil": 16, "guo": 42, "gupta": 64, "gupta2017coop": 64, "gym": [2, 3, 13, 70, 75], "gymnasium": [2, 5, 7, 8, 9, 10, 69, 70, 71, 72, 73, 75, 79, 80, 87, 90, 94, 97], "gymnasium_ag": 86, "gymnasiumag": 86, "h": [43, 71, 72, 73, 90, 92, 93], "ha": [4, 8, 9, 11, 12, 13, 18, 22, 25, 26, 30, 40, 43, 44, 46, 47, 52, 58, 59, 61, 66, 67, 70, 71, 74, 75, 76, 81, 90, 92, 93], "had": [10, 66], "half": [39, 49, 51], "halv": 20, "hanabi": [42, 70, 90], "hanabi_v4": 70, "hanabi_v5": [47, 70, 90], "hand": [9, 10, 45, 47, 48, 49, 50, 51, 70], "hand_siz": 47, "handl": [2, 4, 8, 9, 10, 13, 19, 20, 23, 24, 25, 26, 36, 37, 40, 65, 70, 78, 80, 92], "happen": [71, 90], "harb": 54, "hard": [2, 70, 71, 85], "hard_env": 90, "harder": 71, "hardwar": 13, "hari": 8, "has_maz": 17, "hasattr": 94, "hausknecht": 13, "have": [2, 3, 4, 6, 8, 9, 11, 12, 13, 15, 17, 18, 26, 27, 37, 42, 43, 44, 47, 49, 54, 56, 57, 65, 66, 67, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93, 94, 95, 97], "he": 93, "head": [40, 65], "hear": 54, "heart": [45, 50, 51], "hearthston": 68, "heavili": 90, "height": [12, 40, 41, 71, 76], "held": 34, "help": [9, 10, 20, 25, 43, 63, 69, 70, 71, 72, 73, 75, 76, 85, 86, 87, 89, 90, 92, 93, 94, 95, 97], "helper": [4, 78], "helpingstar": 70, "here": [10, 13, 71, 79, 80, 86, 92, 95], "herng": 42, "heterogen": 8, "heurist": 27, "hidden": [12, 21, 54, 71, 72, 73, 75, 76, 87, 94], "hidden_s": [71, 72, 73, 94, 97], "hide": 63, "high": [8, 9, 30, 38, 61, 72, 73, 77, 87, 96], "higher": [32, 35, 40, 41, 71], "highest": 71, "highli": [8, 9, 38, 41, 70, 77], "hint": [21, 47, 70, 96], "hip": 65, "histogram": 71, "hit": [4, 16, 17, 24, 25, 27, 30, 31, 36, 37, 40, 62], "hoard": 30, "hockei": 13, "hoffmann": 70, "hold": [10, 18, 43, 44, 45, 46, 47, 52, 70, 79, 80, 86, 87, 90], "holdem": [42, 70, 87, 88, 90], "homepag": 70, "homogen": 8, "hook": 70, "hoop": 14, "hope": 13, "hopefulli": 70, "horizont": [44, 52, 65, 67, 71], "horizontal_thrust": 67, "hot": [8, 47], "hotfix": 70, "hour": 70, "hover": 34, "how": [1, 2, 11, 19, 20, 24, 25, 26, 30, 36, 37, 39, 40, 41, 46, 54, 55, 56, 61, 65, 70, 71, 72, 73, 75, 76, 77, 80, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 97], "howev": [2, 9, 24, 29, 30, 47, 49, 71, 86], "hpo": [71, 72, 73, 74], "html": [12, 53, 75, 76, 90, 92, 93], "http": [7, 10, 12, 64, 70, 71, 72, 73, 75, 76, 79, 80, 87, 89, 90, 91, 92, 93, 94, 95, 97], "hu": 42, "huang": [2, 42], "huge": 11, "huggingfac": [68, 70], "hull": 65, "human": [2, 3, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 71, 76, 86, 90, 92, 93, 94, 95], "humanmessag": 86, "hunt": 68, "hyper": [71, 72, 73, 74], "hyperparam": [71, 72, 73], "hyperparamet": [71, 72, 73, 75, 77, 90], "i": [1, 2, 3, 4, 5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 74, 75, 76, 77, 78, 79, 80, 81, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97], "ic": 13, "ice_hockei": 23, "ice_hockey_v2": 23, "iclr": 91, "id": [8, 9, 10, 45, 46, 47, 48, 50, 51, 72, 73, 75, 94], "ideal": 13, "ident": [20, 26], "identifi": [8, 13, 43, 54, 86], "idx": 75, "idx_epi": [71, 72, 73], "idx_step": 71, "ignor": 8, "igor": 54, "illeg": [2, 4, 6, 9, 10, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 70, 71, 86, 90], "illegal_reward": [6, 7], "im": [71, 72, 73], "imag": [4, 8, 13, 41, 43, 70, 71, 72, 73, 89], "imagedraw": [71, 72, 73], "imagefont": 71, "imageio": [71, 72, 73], "imagin": 71, "img": [71, 89], "img_res": 71, "immedi": [20, 65, 71], "impact": 70, "implement": [2, 3, 6, 7, 8, 9, 11, 13, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 52, 65, 66, 67, 68, 70, 74, 77, 78, 83, 85, 86, 88, 91], "impli": 9, "import": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 72, 73, 75, 76, 78, 79, 80, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "import_modul": 75, "importlib": 75, "importorskip": 90, "imposs": 80, "imprecis": [41, 70], "improv": [65, 70, 71], "inaccuraci": 26, "incl": 90, "includ": [2, 5, 6, 9, 10, 39, 45, 47, 53, 54, 64, 65, 68, 69, 70, 74, 75, 77, 78, 83, 85], "inclus": 44, "inconveni": 70, "incorpor": 43, "incorrect": [9, 70], "increas": [8, 49, 70, 71, 74, 85], "increasingli": 71, "indefinit": [14, 18, 22, 27, 28, 29, 33, 34, 35], "independ": [71, 88], "index": [43, 44, 45, 46, 47, 48, 50, 51, 52, 65, 67, 70, 71], "indi_agent_reward": [72, 73], "indic": [8, 11, 12, 44, 47, 52, 66, 67, 76, 86], "individu": [7, 12, 65, 76], "industri": 88, "inf": [55, 56, 57, 58, 59, 60, 61, 62, 63, 65], "inf_mask": 87, "infer": [10, 47, 71, 72, 73, 79, 80], "infin": 62, "info": [2, 3, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93], "inform": [1, 2, 3, 7, 8, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70, 71, 72, 73, 74, 77, 86, 87, 88, 89, 90, 91, 92, 93], "inher": 46, "inherit": [6, 10], "inidivdu": [72, 73], "init": [10, 12, 71, 75, 76, 79, 80, 87, 89], "init_hp": [71, 72, 73], "initi": [6, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 71, 72, 73, 79, 80, 90], "initial_epsilon": 87, "initialpopul": [71, 72, 73], "inproceed": 64, "input": [5, 6, 10, 38, 54, 67, 71, 72, 73], "input_dict": [87, 89], "insert": [2, 3, 6, 7, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69], "insid": [8, 63], "inspect": [11, 86], "inspir": [12, 68, 76], "instal": [1, 7, 8, 10, 70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "instantan": [2, 9], "instanti": [71, 72, 73], "instantli": 90, "instead": [4, 6, 8, 10, 13, 17, 40, 43, 47, 70, 71], "institut": 71, "instruct": [70, 75, 86], "instrument": 13, "insuffici": [43, 70], "int": [2, 3, 4, 10, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 70, 71, 75, 86, 87, 89, 90, 92, 93, 94], "int64": 10, "int8": [80, 86], "integ": [2, 3, 9, 10, 43, 44, 47, 49, 50, 70, 90], "integr": [70, 75, 78, 85], "intellig": [13, 64], "intend": [4, 11, 55, 68, 81, 91], "intens": [8, 90], "intent": [12, 76], "interact": [2, 3, 4, 7, 10, 38, 54, 69, 70, 71, 85, 86], "interest": [27, 70, 71], "interfac": [9, 68, 69, 85, 91, 95], "intermit": 8, "intern": [2, 4, 9, 10, 11, 64, 79, 80], "internal_render_mod": 10, "internet": 86, "interpol": 8, "intersect": 46, "interv": 71, "introduc": [8, 13, 71], "introduct": 96, "introductori": 74, "invad": [8, 13, 72], "invalid": [2, 80, 90], "invis": [17, 20, 30], "invisible_invad": 30, "involv": [24, 51, 85], "io": [90, 91, 92, 93], "is_avail": [12, 71, 72, 73, 75, 76, 94, 97], "is_first": 4, "is_invis": 17, "is_last": [4, 10], "is_paralleliz": 70, "is_vector_env": 75, "isinst": [2, 11, 75, 94, 97], "isort": [70, 86], "issu": [2, 10, 11, 27, 40, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93, 94, 95, 97], "item": [12, 67, 72, 73, 75, 76, 86, 90], "item_1": 10, "item_2": 10, "iter": [9, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 71], "its": [8, 9, 10, 11, 25, 39, 40, 42, 45, 46, 47, 48, 49, 51, 54, 65, 71, 94], "itself": [9, 40, 66, 71, 87, 89, 90], "j": [8, 13, 40, 48, 66], "jab": 15, "jack": 48, "jacob975": 70, "jammf": 70, "jayesh": 64, "jean": 54, "jet": [7, 12, 16, 76], "jjshoot": [12, 70, 76], "joel": 13, "join": [70, 71, 72, 73, 75, 94, 97], "joint": 65, "jordan": 7, "joschu": [12, 75, 76], "journal": [8, 13, 42, 54], "joust": 13, "joust_v3": 24, "jump": [34, 35], "jun": [7, 13], "junyu": 42, "just": [8, 9, 10, 11, 40, 90], "k": [8, 13, 40, 45, 47, 48, 50, 51, 64, 66, 75], "kallinteri": 70, "kaz": 70, "kchour": 70, "keep": [8, 16, 25, 39, 54, 65, 67, 71, 78, 81, 90], "kei": [2, 3, 9, 15, 16, 17, 31, 39, 40, 41, 57, 66, 70, 72, 73, 75, 77, 90, 92, 93], "kept": 10, "kernel": [71, 72], "kernel_s": [71, 72], "kick": 25, "kill": [4, 40], "killable_arch": 40, "killable_knight": 40, "king": [43, 45, 48], "kingsid": 43, "kir0ul": 70, "kl": [12, 75, 76], "knee": 65, "knight": [2, 4, 13, 38, 43, 70, 91], "knight_0": 40, "knight_1": 40, "knights_archers_zombi": [10, 40, 70], "knights_archers_zombies_v0": 10, "knights_archers_zombies_v10": [9, 10, 38, 40, 69, 92], "knock": [25, 45], "knock_reward": 45, "know": [56, 71], "knowledg": 47, "known": [8, 27, 45, 59], "ko": 15, "kochenderf": 64, "komi": 46, "kw": 87, "kwarg": [4, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 87, 89, 90], "kwei": 42, "l": [40, 75], "laboratori": 64, "lai": 42, "laid": 78, "lambda": [11, 75, 86, 87, 89, 94, 95], "lambda_": 89, "landmark": [54, 55, 56, 57, 58, 59, 60, 61, 62, 63], "landmark_id": [58, 59], "landmark_rel_posit": [55, 56, 61, 62, 63], "langchain": 70, "languag": [54, 85], "laptop": [90, 92], "larg": [2, 62, 65, 67, 70, 96], "largest": [8, 47, 49, 90], "last": [2, 4, 6, 7, 8, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 86, 87, 89, 90, 92, 93], "last_opp_mov": 71, "lastgaelam": 75, "latest": [43, 71], "latest_polici": [90, 92, 93], "launch": [13, 38, 42, 54, 64, 90, 92, 93], "layer": [9, 12, 22, 71, 72, 73, 75, 76], "layer_init": 75, "layout": 43, "ldot": 46, "leadadversary_0": 63, "leader": 63, "leader_comm": 63, "leaderboard": 77, "leaf": 2, "learn": [2, 3, 5, 7, 8, 12, 13, 27, 38, 39, 41, 42, 56, 57, 58, 61, 64, 68, 69, 70, 72, 73, 74, 75, 76, 77, 88, 90, 91, 92, 93, 94, 96], "learn_step": [71, 72, 73], "learnabl": 70, "learner": [12, 76], "learning_r": [75, 93], "least": [10, 27, 47, 78, 96], "leav": [2, 13, 26, 30, 32], "leduc": [42, 70, 87, 90], "leduc_holdem": 48, "leduc_holdem_v4": [48, 87, 90], "leduoc": 87, "leela": [70, 88], "leelachesszero": 43, "left": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 46, 47, 54, 65, 66, 70, 71, 79, 80], "left_paddle_spe": [9, 39], "leftmost": 65, "leg": 65, "legal": [42, 71, 86], "legal_mov": 47, "len": [10, 12, 71, 72, 73, 76, 89, 92, 93, 94, 97], "length": [2, 3, 8, 9, 12, 46, 47, 65, 67, 71, 76, 94], "less": [13, 30, 71, 92], "lesson": 71, "lesson1_trained_ag": 71, "lesson2_trained_ag": 71, "lesson3_trained_ag": 71, "lesson4_trained_ag": 71, "lesson_numb": 71, "let": [33, 71, 91], "level": [9, 30, 32, 37, 61, 71, 81], "leverag": [92, 93], "librari": [9, 13, 42, 68, 70, 74, 77, 88, 91], "lidar": 65, "life": [20, 24, 25, 37, 47, 70], "lightweight": [9, 77, 96], "like": [2, 3, 8, 9, 10, 11, 12, 13, 17, 22, 39, 40, 43, 47, 54, 65, 68, 70, 71, 76, 86, 87, 89, 90], "limit": [2, 4, 42, 48, 67, 70], "line": [10, 12, 40, 52, 67, 70, 71, 76, 79, 80, 91, 96], "line_death": 40, "linear": [8, 12, 75, 76, 89], "linear_interp": 8, "linearli": 8, "link": [68, 70], "lint": 70, "linux": 9, "list": [2, 3, 4, 9, 10, 12, 43, 44, 45, 46, 47, 48, 50, 51, 52, 70, 71, 72, 73, 76, 90, 94, 97], "listen": [54, 59, 73, 74], "listener_0": 60, "liter": 32, "littl": 39, "live": [3, 6, 10, 25, 30, 37, 70], "lizard": [49, 70], "load": [7, 70, 71, 72, 73, 87, 89, 90, 92, 93, 94, 95], "load_state_dict": [71, 94], "loadcheckpoint": [71, 72, 73], "local": [41, 59, 61, 67, 70], "local_dir": 89, "local_ratio": [41, 59, 61, 65, 67, 70], "local_reward": 41, "locat": [21, 27, 44, 46, 63, 67, 71, 81], "locomot": 7, "log": [4, 12, 70, 71, 75, 76, 87, 96, 97], "log_level": [87, 89], "log_path": 94, "log_prob": [12, 75, 76], "logdir": 94, "logger": [4, 10, 94], "logic": [5, 6, 10, 12, 47, 70, 75, 76, 78, 83], "logical_and": 71, "logit": [12, 75, 76, 87], "logo": 70, "logprob": [12, 75, 76], "logratio": [12, 75, 76], "long": [11, 12, 15, 27, 32, 75, 76, 85, 90], "longer": [8, 10, 14, 18, 20, 22, 27, 28, 29, 33, 34, 35, 40, 41, 70, 92], "longest": [19, 39, 90], "look": [2, 9, 10, 11, 13, 26, 40, 70, 71], "loop": [2, 68, 70, 72, 73, 89], "lose": [4, 6, 19, 20, 24, 25, 26, 37, 42, 45, 47, 71, 86], "loser": [43, 45, 46, 48, 49, 50, 51, 52], "loss": [12, 42, 47, 75, 76, 90], "loss_avoiding_act": 71, "lost": [47, 67], "lot": 85, "low": [8, 54, 71, 72, 73, 87], "lowe2017multi": 54, "lower": [9, 40, 41], "lower_bound": [8, 72, 75], "lowest": 47, "lr": [12, 71, 72, 73, 75, 76, 89, 94, 97], "lr_actor": [72, 73], "lr_critic": [72, 73], "lrnow": 75, "lru_cach": [10, 79, 80], "lst": 71, "lurk": [19, 20], "m": [1, 13, 40, 51, 71, 90, 92, 93], "mace": 40, "machado": [8, 13], "machado2018revisit": 13, "machin": 68, "maco": [9, 70], "maddpg": [70, 74], "maddpg_trained_ag": 72, "made": [1, 4, 44, 64, 65, 68, 70, 86], "madrl": [8, 64], "magent": 70, "magent2": [2, 70], "magnitud": [8, 67], "mahjong": 70, "mai": [2, 3, 9, 10, 43, 46, 67, 68, 71, 90], "main": [3, 25, 26, 43, 44, 45, 46, 47, 48, 50, 51, 52, 56, 85, 86], "maintain": [43, 68, 70], "major": [64, 67, 68, 70], "make": [1, 2, 4, 6, 8, 9, 11, 20, 27, 30, 39, 40, 41, 43, 44, 45, 46, 47, 49, 52, 54, 65, 66, 67, 70, 71, 74, 81, 85], "makedir": [71, 72, 73, 97], "man": 36, "manag": [4, 71, 85], "maneuv": 23, "mani": [2, 4, 8, 11, 40, 42, 68, 70, 71, 77, 80, 86, 90], "manner": [6, 54], "manu": 70, "manual": [2, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 67, 70], "manual_control": 70, "manual_polici": [38, 70], "manual_se": [75, 94, 97], "manualpolici": 38, "map": [10, 16, 17, 20, 21, 26, 27, 31, 47, 54, 66, 70, 71], "marc": 13, "mario": 13, "mario_bro": 25, "mario_bros_v3": 25, "maritim": 68, "mark": [2, 7, 52, 90], "markdown": [1, 70], "markov": 71, "markovvectorenv": 92, "marl": [2, 8, 69, 94, 97], "marlo": 13, "mask": [8, 10, 42, 70, 71, 83, 87, 91], "mask_fn": 90, "maskabl": 90, "maskableactorcriticpolici": 90, "maskableppo": 90, "mass": 41, "massiv": [68, 70], "master": [32, 70, 71, 75, 90, 92, 93], "mat": 70, "match": [4, 10, 33, 68, 70, 87, 94], "matd3": [70, 74], "matd3_trained_ag": 73, "materi": [43, 70], "matrix": [7, 40], "matter": [9, 11], "matthew": 13, "max": [8, 12, 13, 47, 70, 71, 72, 73, 75, 76, 90, 92, 93], "max_act": [71, 72, 73], "max_arrow": 40, "max_batch_s": [71, 72], "max_cycl": [9, 11, 12, 13, 39, 40, 41, 49, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70, 76, 86, 89, 92], "max_cycles_test": 11, "max_episod": [4, 71, 72, 73], "max_epoch": 97, "max_fram": 70, "max_grad_norm": 75, "max_information_token": 47, "max_it": 9, "max_learn_step": [71, 72], "max_length": 71, "max_life_token": 47, "max_lr": [71, 72], "max_num_ag": [2, 3, 9], "max_observation_v0": [8, 13, 75], "max_reward": 39, "max_skip": 8, "max_step": [4, 71, 72, 73], "max_train_episod": 71, "max_zombi": [40, 92], "maxandskip": [8, 13], "maxim": [13, 27, 30, 64, 86], "maximis": 71, "maximum": [8, 13, 40, 47, 65, 67, 70, 71, 72, 73, 75], "maxlen": [71, 86], "maxpool2d": [12, 76], "maxsiz": [10, 79, 80], "maze": [13, 17, 19, 20], "maze_craz": 26, "maze_craze_v3": 26, "mb_advantag": 75, "mb_ind": 75, "mclean": 70, "md": [1, 70, 78], "mean": [9, 10, 12, 14, 18, 20, 22, 27, 28, 29, 33, 34, 35, 37, 40, 41, 44, 49, 54, 56, 65, 66, 70, 71, 72, 73, 75, 76, 78, 94], "mean_fit": 71, "mean_reward": [94, 97], "mean_scor": 71, "mean_turn": 71, "mean_turns_per_gam": 71, "mechan": 8, "medium_env": 90, "meet": 70, "meltingpot": 68, "meltingpot_compat": 7, "meltingpotcompatibilityv0": 7, "mem_ful": 71, "member": 71, "memoiz": [10, 79, 80], "memor": 13, "memori": [8, 21, 26, 71, 72, 73], "memory_s": [71, 72, 73], "mental": 2, "merg": [49, 70], "messag": [4, 9, 11, 54, 57, 70], "message_histori": 86, "metadata": [10, 70, 71, 78, 79, 80, 90, 92, 93], "method": [3, 8, 9, 10, 11, 39, 43, 54, 65, 70, 71, 79, 80, 90], "metric": 85, "mgoulao": 70, "michael": [13, 72, 73], "microwrapp": 8, "middl": 79, "might": 71, "mikcnt": 70, "mikepratt1": [70, 72, 73], "million": 75, "mimwrit": [71, 72, 73], "min": [62, 71], "min_act": [71, 72, 73], "min_batch_s": [71, 72], "min_learn_step": [71, 72], "min_lr": [71, 72], "min_skip": 8, "mind": 54, "mini": 75, "miniatur": 68, "minibatch": 75, "minibatch_s": 75, "minigo": 46, "minim": [15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 31, 33, 37, 47, 70, 78, 95, 97], "minimap": 70, "minimum": [8, 50, 51, 61, 63, 67, 71, 90], "minor": [40, 41, 54, 70], "minut": [15, 90, 92, 93], "mirror": 75, "misc": [39, 40, 41, 65, 66, 67, 70], "miscellan": 70, "missil": 16, "mistak": 71, "mistakenli": 70, "misus": 70, "mix": [24, 25, 54], "mixtur": 54, "ml": [68, 70, 88, 94, 95, 97], "mlp": [71, 72, 73, 90, 91, 93], "mlppolici": [92, 93], "mode": [2, 3, 6, 8, 9, 10, 11, 16, 17, 26, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 65, 66, 67, 70, 72, 75, 89, 92], "model": [2, 9, 72, 73, 74, 85, 86, 87, 89, 90, 91, 92, 93, 94, 97], "model_config": 87, "model_out": 89, "model_save_path": [94, 97], "modelcatalog": [87, 89], "modern": [13, 68], "modifi": [71, 75], "modul": [9, 12, 70, 75, 76, 89, 90, 92, 93], "modular": [77, 81, 96], "momentum": [31, 41], "monitor_gym": 75, "month": 13, "mordatch": 54, "mordatch2017emerg": 54, "more": [1, 2, 3, 7, 9, 10, 25, 27, 30, 31, 37, 39, 45, 46, 47, 49, 54, 61, 68, 70, 71, 74, 77, 78, 80, 87, 88, 89, 90, 91, 92, 93], "most": [6, 8, 9, 10, 13, 27, 42, 49, 54, 70, 71, 90], "mostli": [42, 54], "motion": [35, 54], "move": [4, 6, 9, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 54, 60, 66, 67, 70, 71, 79, 80, 86, 90], "move_down": [56, 58, 59, 60, 61, 62, 63], "move_left": [56, 58, 59, 60, 61, 62, 63], "move_right": [56, 58, 59, 60, 61, 62, 63], "move_up": [56, 58, 59, 60, 61, 62, 63], "moveaxi": [71, 72, 73], "movement": [16, 41, 54, 80], "moving_shield": 30, "mpe": [55, 56, 57, 58, 59, 60, 61, 62, 63, 70, 71, 72, 73], "mpe_environ": 70, "mqueue": 4, "much": [8, 30, 41, 70, 71, 90], "multi": [2, 3, 9, 13, 54, 64, 68, 69, 70, 72, 73, 74, 86, 88, 91, 96], "multi_ag": 87, "multi_agent_replay_buff": [72, 73], "multiag": [3, 55, 64, 68], "multiagentenv": 70, "multiagentpolicymanag": [94, 95, 97], "multiagentreplaybuff": [72, 73], "multibinari": 2, "multidiscret": [2, 79, 80], "multipl": [2, 34, 67, 68, 70, 74, 86], "multiplay": [13, 68], "multipli": [65, 67], "multithread": [92, 93], "multiwalk": [64, 70], "multiwalker_v9": [6, 65], "murtazarang": 70, "must": [2, 3, 6, 9, 10, 14, 22, 23, 27, 28, 29, 32, 34, 35, 39, 40, 41, 43, 44, 46, 47, 49, 52, 54, 57, 58, 60, 61, 65, 66, 67, 71, 79, 80, 90], "mutat": [71, 72, 73], "mutation_sd": [71, 72, 73], "mutual": 2, "mykel": 64, "m\u016b": 68, "n": [2, 4, 8, 9, 12, 40, 43, 46, 49, 56, 61, 71, 72, 73, 75, 76, 79, 80, 87, 90, 94, 97], "n_agent": [72, 73], "n_catch": 66, "n_coop": 67, "n_cycl": 70, "n_episod": [94, 95], "n_evad": [66, 67], "n_obstacl": 67, "n_piston": [41, 89], "n_poison": 67, "n_pursuer": [66, 67], "n_sensor": 67, "n_step": [71, 94, 97], "n_walker": 65, "naddaf": 13, "name": [2, 3, 4, 8, 9, 10, 39, 40, 41, 43, 44, 46, 47, 49, 52, 65, 66, 67, 70, 71, 75, 78, 79, 80, 86, 87, 89, 90, 92, 93], "namespac": 94, "nan": [4, 8, 12, 70, 75, 76], "nan_noop_v0": 8, "nan_random_v0": 8, "nan_zeros_v0": 8, "narg": [75, 94], "narrow": 21, "natur": [2, 54, 80], "navig": [19, 20, 60, 67], "ncp": 37, "ndarrai": [2, 3, 47], "ne": 43, "necessari": [8, 10, 71, 72, 73, 79, 80], "necessarili": 10, "need": [1, 4, 9, 10, 11, 19, 20, 21, 27, 31, 67, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93, 94, 95, 97], "neg": [39, 45, 56, 62, 67, 71, 90], "negat": 47, "neighbor": [65, 67], "neighbour": 65, "nest": 2, "net": [12, 35, 75, 76, 94, 97], "net_config": [71, 72, 73], "network": [2, 8, 10, 12, 39, 40, 41, 43, 44, 46, 47, 49, 52, 65, 66, 67, 71, 72, 73, 75, 76, 87, 94, 97], "neural": [8, 43, 54, 71], "never": [9, 45, 70], "nevertheless": 43, "new": [4, 5, 9, 10, 11, 25, 26, 27, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 68, 70, 71, 72, 73, 83, 85, 90], "new_height": 71, "new_layer_prob": [71, 72, 73], "new_width": 71, "newli": [71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "newlogprob": [12, 75, 76], "newvalu": 75, "next": [2, 4, 6, 9, 10, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70, 71, 72, 73, 90, 91], "next_ag": 90, "next_don": 75, "next_ob": [12, 75, 76], "next_stat": [71, 72, 73], "next_termin": 75, "next_trunc": 75, "next_valu": 75, "nextnontermin": 75, "nextvalu": 75, "nhvkkya6qx": 70, "nick": [71, 72], "nicku": [70, 71, 72, 73], "nickua": 73, "nip": 54, "nn": [12, 75, 76, 87, 89], "no_act": [56, 58, 59, 60, 61, 62, 63], "no_grad": [12, 71, 75, 76], "no_mov": 10, "no_mut": [71, 72, 73], "no_op_act": 8, "node": 2, "nois": 65, "noisi": 65, "non": [11, 13, 38, 40, 42, 46, 70, 71, 91], "non_zero": 71, "none": [2, 3, 4, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 75, 76, 78, 79, 80, 86, 87, 89, 90, 92, 93, 94, 97], "noop": 8, "noqa": [75, 86], "norm": [67, 75], "norm_adv": 75, "normal": [8, 11, 12, 30, 33, 40, 63, 65, 71, 72, 75, 76], "normalize_obs_v0": [8, 89], "notabl": [13, 70], "notat": 43, "note": [2, 4, 6, 8, 9, 10, 17, 19, 20, 25, 26, 27, 34, 37, 40, 42, 43, 45, 54, 63, 64, 66, 68, 71, 75, 79, 80, 81, 90, 91, 92, 93], "noth": [27, 34, 40, 54, 86], "notori": 85, "novel": 7, "now": [10, 40, 68, 70, 71, 72, 73, 79, 81, 86], "np": [8, 10, 12, 62, 71, 72, 73, 75, 76, 79, 80, 87, 94, 97], "npc": [24, 37], "nstart": [92, 93], "nth": [2, 9, 46], "num": [75, 94], "num_act": [12, 49, 76], "num_adversari": [62, 63], "num_ag": [2, 3, 6, 9, 12, 72, 73, 76], "num_arch": 40, "num_atom": 71, "num_col": 71, "num_cpu": [75, 92, 93], "num_cycl": [11, 70, 81], "num_env": 75, "num_food": 63, "num_forest": 63, "num_fram": 8, "num_gam": [90, 92, 93], "num_good": [62, 63], "num_gpu": [87, 89], "num_it": 10, "num_knight": 40, "num_minibatch": 75, "num_mov": 10, "num_obstacl": [62, 63], "num_output": [87, 89], "num_play": [14, 22, 28, 35, 50, 51, 70, 86], "num_rollout_work": [87, 89], "num_row": 71, "num_sgd_it": 89, "num_step": [12, 75, 76], "num_sword": 40, "num_upd": 75, "number": [2, 4, 6, 8, 10, 11, 12, 13, 14, 15, 22, 26, 27, 28, 30, 32, 33, 35, 40, 41, 43, 46, 47, 48, 49, 50, 51, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70, 71, 72, 73, 75, 76, 90, 92, 96], "numer": [40, 70], "numpi": [2, 3, 8, 9, 10, 12, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 87, 94, 97], "nw": 43, "o": [4, 40, 52, 71, 72, 73, 75, 86, 87, 89, 90, 92, 93, 94, 97], "ob": [12, 70, 75, 76, 86, 87, 89, 90, 92, 93], "object": [4, 39, 41, 45, 67, 71, 72, 73], "obs_buff": 86, "obs_len": 87, "obs_messag": 86, "obs_rang": 66, "obs_spac": [87, 89], "obs_typ": 13, "obsdict": 70, "observ": [2, 3, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 66, 68, 69, 70, 71, 72, 73, 76, 79, 80, 85, 86, 87, 89, 90, 91, 92, 93, 94, 97], "observation_s": [12, 76], "observation_spac": [2, 3, 9, 10, 12, 39, 40, 41, 43, 44, 46, 47, 49, 52, 65, 66, 67, 70, 71, 72, 73, 75, 76, 78, 79, 80, 87, 90, 94, 97], "observation_typ": 47, "observation_vector_dim": 47, "obsolet": 10, "obstacl": [17, 32, 54, 62, 63, 66, 67], "obstacle_coord": 67, "obstacle_radiu": 67, "obstyp": [2, 3, 6], "occasion": 39, "occupi": 43, "occur": 86, "odd": [49, 70], "off": [11, 13, 17, 25, 39, 41, 65, 67, 75, 91], "off_screen_penalti": 39, "offens": 23, "offer": 74, "offici": [9, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 70, 77], "offlin": 71, "offpolicy_train": [94, 97], "often": [2, 10, 13, 54], "old": [8, 10, 12, 26, 71, 76], "old_approx_kl": [12, 75, 76], "oldest": [43, 71], "olymp": [14, 22, 28, 29, 35], "onc": [1, 2, 3, 18, 32, 42, 70, 71], "one": [2, 6, 8, 9, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 56, 60, 68, 70, 71], "one_hot": [71, 72, 73], "ones": [10, 43, 80], "onli": [2, 3, 6, 10, 11, 13, 17, 18, 19, 20, 26, 30, 40, 42, 45, 47, 49, 54, 59, 65, 70, 71, 75, 90, 91, 96], "onlin": 68, "onto": [25, 35], "open": [8, 10, 13, 17, 68, 71, 77, 88], "openai": [8, 13, 54, 86], "openscenario": 68, "openspiel": [2, 47, 70], "openspiel_compat": 7, "openspielcompat": 70, "openspielcompatibilityv0": 7, "oper": [8, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 74], "opp": 71, "opp_three_count": 71, "opp_three_in_row": 71, "opp_update_count": 71, "oppon": [14, 15, 16, 17, 19, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 44, 45, 46, 48, 49, 66, 71, 94], "opponent_difficulti": 71, "opponent_first": 71, "opponent_path": 94, "opponent_pool": 71, "opponent_pool_s": 71, "opponent_upd": 71, "opponent_upgrad": 71, "opponents_hand_vis": 45, "opportun": [25, 37, 71], "oppos": [2, 54], "opposit": [20, 71], "optim": [12, 20, 38, 41, 65, 66, 71, 75, 76, 85, 89, 90, 92, 93, 94, 97], "optimis": [71, 72, 73, 74], "option": [2, 3, 10, 11, 13, 30, 39, 40, 41, 43, 44, 45, 46, 47, 49, 52, 54, 65, 66, 67, 70, 71, 79, 80, 90, 94, 97], "orang": 66, "orchestr": 74, "order": [2, 4, 6, 21, 27, 40, 45, 47, 49, 70, 85, 90, 92], "orderenforcingwrapp": [6, 10], "ordinari": 47, "org": [10, 79, 80, 90], "organ": 64, "orient": [43, 54, 65], "orig_obs_spac": 87, "origin": [4, 6, 8, 13, 43, 54, 64, 70], "orthogonal_": [12, 75, 76], "othello": 13, "othello_v3": 27, "other": [2, 5, 6, 8, 9, 10, 11, 13, 20, 22, 25, 26, 29, 30, 32, 35, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 56, 59, 60, 61, 63, 65, 66, 67, 70, 71, 74, 85], "other_agent_rel_posit": [56, 58, 61, 62, 63], "other_agent_veloc": [62, 63], "other_agents_rel_posit": 56, "otherwis": [6, 21, 39, 43, 47, 90], "our": [1, 2, 6, 9, 10, 12, 13, 43, 45, 46, 48, 51, 70, 71, 76, 81, 83], "out": [4, 6, 11, 12, 15, 32, 39, 54, 68, 70, 71, 72, 73, 74, 75, 76, 78, 89, 90], "outcom": [71, 86], "outperform": 90, "output": [4, 5, 6, 8, 10, 11, 54, 70, 87], "output_kei": 86, "output_pars": 86, "outsid": [2, 3, 4, 6, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 65, 66, 67, 70, 78], "over": [2, 4, 8, 10, 13, 25, 27, 34, 37, 39, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 57, 67, 70, 71, 79, 80, 85, 87], "overal": 41, "overestim": 73, "overhaul": 70, "overhead": 9, "overridden": [10, 79, 80], "overview": 10, "overwrit": [79, 80], "own": [11, 12, 21, 27, 39, 40, 46, 47, 54, 69, 71, 76, 78], "p": [71, 79, 80], "p0_action": 71, "p0_action_mask": 71, "p0_next_stat": 71, "p0_next_state_flip": 71, "p0_state": 71, "p0_state_flip": 71, "p1_action": 71, "p1_action_mask": 71, "p1_next_stat": 71, "p1_next_state_flip": 71, "p1_state": 71, "p1_state_flip": 71, "pa_model": 87, "packag": [1, 7, 8, 10, 65, 70, 71, 78, 94, 95, 97], "pad": [8, 12, 40, 43, 71, 76], "pad_action_space_v0": 8, "pad_observ": 40, "pad_observations_v0": 8, "paddl": [22, 29, 39], "paddle_0": 39, "paddle_1": 39, "page": [13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 70], "pair": 49, "paper": [2, 3, 10, 43, 64, 66, 70, 75, 88, 90, 95], "par_env": 6, "paradigm": [3, 70], "parallel": [2, 5, 8, 12, 43, 44, 45, 46, 47, 48, 50, 51, 52, 68, 69, 70, 72, 73, 74, 75, 76, 78, 83, 88, 89, 93], "parallel_api_test": [3, 11, 70, 81], "parallel_env": [3, 6, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 72, 73, 75, 76, 89, 92, 93], "parallel_env_fn": 11, "parallel_rp": 10, "parallel_seed_test": [11, 70], "parallel_test": 70, "parallel_to_aec": [6, 10, 70, 79, 80], "parallel_to_aec_wrapp": 6, "parallel_wrapper_fn": 70, "parallelenv": [6, 10, 78, 79, 80], "parallelpettingzooenv": 89, "param": [12, 71, 75, 76], "param_group": 75, "paramet": [6, 8, 9, 12, 41, 47, 59, 61, 67, 70, 71, 72, 73, 74, 75, 76, 88, 91, 94, 97], "parametr": 90, "parametricactionsmodel": 87, "pariti": 49, "parrellenv": 70, "pars": [8, 86, 94], "parse_arg": [75, 87, 89], "parse_known_arg": 94, "parser": [75, 87, 89, 94], "part": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 70, 71, 79, 88], "parti": 70, "partial": [2, 3, 11, 68, 70], "particl": [54, 73, 74], "particular": [6, 9, 10, 20, 26, 40, 63, 70], "pass": [4, 8, 9, 10, 11, 22, 23, 26, 40, 46, 70, 78], "passant": [43, 70], "past": [22, 23, 28, 33, 47, 70], "path": [2, 13, 16, 32, 40, 70, 71, 72, 73, 75, 81, 87, 89, 90, 92, 93, 94, 97], "pattern": 8, "pawn": [43, 80], "pbar": 71, "peculiar": 8, "penal": [15, 16, 17, 21, 31, 45, 61, 62, 67, 90], "penalti": [39, 45, 65, 70], "penni": 68, "peopl": 71, "pep": 70, "per": [2, 8, 13, 18, 24, 47, 67, 71, 75, 92, 94], "perfectli": [46, 54], "perform": [8, 47, 54, 70, 71, 72, 73, 74, 75, 77, 90, 91, 94], "performance_benchmark": 11, "permiss": 70, "permit": 70, "permut": [75, 89], "persist": 85, "perspect": [70, 71], "pest": 25, "pettingzoo": [2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 71, 72, 73, 75, 76, 78, 79, 80, 81, 83, 85, 87, 89, 91, 92, 93, 94, 95, 97], "pettingzoo_ag": 86, "pettingzoo_env": [87, 89, 94, 97], "pettingzoo_env_to_vec_env_v1": [75, 92, 93], "pettingzooag": 86, "pettingzooenv": [87, 89, 94, 95, 97], "pg_loss": [12, 75, 76], "pg_loss1": [12, 75, 76], "pg_loss2": [12, 75, 76], "philosophi": 2, "physic": [11, 31, 41, 65, 68, 70], "pi": 65, "pick": [43, 45], "pickl": 70, "piec": [27, 34, 43, 46, 70, 71, 85], "pieter": 54, "pil": [71, 72, 73, 89], "pile": [45, 47], "pillow": [70, 71, 72, 73, 87, 89], "pimpal": 70, "pip": [1, 7, 8, 9, 10, 13, 38, 42, 54, 64, 70], "piston": [41, 70], "piston_0": 41, "piston_1": 41, "piston_19": 41, "pistonbal": [3, 12, 38, 70, 76, 77, 87, 88], "pistonball_v6": [3, 4, 6, 9, 10, 11, 12, 38, 41, 76, 87, 89], "pixel": [13, 39, 40, 41, 54, 70], "place": [8, 9, 10, 27, 44, 46, 47, 52, 54, 65, 66, 71, 79], "placehold": [71, 72, 73], "placement": [44, 52], "plagu": 8, "plai": [2, 3, 9, 10, 18, 25, 32, 39, 43, 47, 49, 52, 68, 70, 74, 79, 90, 92, 93, 94, 95, 97], "plain": 8, "plan": [25, 26, 32], "plane": [13, 43, 44, 45, 46, 52], "platform": [13, 96], "play_continu": 71, "playabl": 68, "player": [2, 4, 6, 10, 13, 14, 15, 16, 17, 18, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 68, 70, 71, 75, 79, 86, 91, 94], "player1": 4, "player2": 4, "player_": 10, "player_0": [43, 44, 45, 47, 48, 49, 50, 51, 71, 87], "player_1": [43, 44, 45, 47, 48, 49, 50, 51, 52, 71, 87], "player_2": 52, "player_idx": 75, "pleas": [7, 8, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 70, 71, 72, 73, 75, 76, 78, 86, 87, 89, 90, 92, 93, 94, 95, 97], "plot": 75, "plu": [27, 41, 50, 67], "plugin": 1, "point": [9, 14, 15, 16, 17, 18, 21, 22, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 40, 44, 45, 46, 47, 79, 80, 83, 92], "poison": 67, "poison_reward": 67, "poison_spe": 67, "poker": [51, 70, 88], "polici": [2, 3, 4, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 72, 73, 75, 76, 87, 89, 90, 91, 92, 93, 94, 95, 97], "policy_fn": 89, "policy_freq": 73, "policy_loss": 75, "policy_mapping_fn": 87, "pong": [13, 38, 70], "pong_v3": [28, 75], "pool": 71, "poor": [27, 90], "poorli": 90, "pop": [71, 72, 73], "popul": [54, 71, 72, 73], "popular": [8, 42, 68, 88], "population_s": [71, 72, 73], "pose": 8, "posg": [2, 3, 70], "posit": [16, 17, 24, 31, 33, 40, 41, 43, 47, 52, 54, 55, 56, 63, 65, 67, 70, 71, 90, 93], "position_nois": 65, "possibl": [2, 4, 8, 9, 10, 11, 13, 20, 26, 30, 32, 39, 40, 43, 47, 49, 52, 54, 70, 71], "possible_ag": [2, 3, 9, 10, 12, 70, 76, 79, 80, 86, 87, 89, 90, 92, 93], "post": 91, "pot": 51, "potenti": [2, 17, 25, 70], "power": [15, 19, 20, 85], "powerup": 20, "ppo": [12, 68, 77, 87, 88, 91], "ppo_mask": 90, "ppo_pettingzoo_ma_atari": 75, "ppo_pettingzoo_ma_ataripi": 75, "ppo_pistonball_v6_660ce_00000_0_2021": [87, 89], "ppoagent": 89, "ppoconfig": 89, "pr": [9, 70], "practic": [71, 81], "pragmat": 71, "pre": [5, 8, 70, 71, 72, 91, 92, 94], "precis": [13, 15, 18], "predat": 62, "predefin": 8, "predict": [17, 31, 33, 87, 90, 92, 93], "prefer": 8, "prei": 62, "prematur": [19, 20, 24, 25, 26, 36, 37, 40, 65], "prepend": 40, "preprint": [8, 13, 42, 54], "preprocess": 88, "present": 4, "press": [34, 40], "pretrain": [71, 87, 89], "pretrained_path": 71, "pretti": [10, 79, 80], "prevent": [8, 14, 18, 22, 27, 28, 29, 33, 34, 35, 63, 80], "previou": [10, 13, 43, 47, 65, 70, 71, 72, 73, 80], "primarili": 55, "print": [2, 3, 4, 6, 9, 10, 11, 12, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93, 94, 97], "prior": 8, "prior_ep": 71, "priorit": 71, "prioriti": 71, "prison": [7, 68, 70, 79, 80], "prisoner_act": [79, 80], "prisoner_action_mask": 80, "prisoner_i": [79, 80], "prisoner_x": [79, 80], "prisoners_dilemma_in_the_matrix__arena": 7, "privat": 57, "private_kei": 57, "prob": [12, 75, 76], "probabl": [2, 8, 9, 71, 72, 73, 87, 89], "probit": 87, "problem": [8, 13, 65, 68, 69, 70, 71], "problemat": 9, "process": [5, 8, 13, 25, 54, 70, 71, 72, 73, 78, 83, 91, 92], "produc": [11, 13, 67, 91], "product": [59, 63], "profici": 43, "program": 2, "progress": [2, 3, 9, 71], "project": [70, 71, 75, 83], "promot": 43, "proper": [43, 46, 70, 79, 80], "properli": [11, 90], "properti": 65, "proport": [41, 66, 67], "propos": 70, "prospector": 70, "protect": 30, "protocol": [8, 13], "provid": [2, 3, 4, 5, 6, 10, 40, 41, 70, 71, 74, 77, 85, 86, 87, 89, 91, 92, 96, 97], "proxim": [89, 90, 92, 93], "prune": 66, "pseudo": 70, "pt": [71, 72, 73], "pth": [94, 97], "public": [48, 57, 77], "publish": 70, "puck": 23, "pull": 70, "punch": 15, "punish": 54, "pure": [14, 18, 22, 27, 28, 29, 33, 34, 35, 96], "purpl": 67, "purpos": [55, 75, 91], "pursu": 67, "pursuer": [66, 67, 70], "pursuer_0": [66, 67], "pursuer_1": [66, 67], "pursuer_4": 67, "pursuer_7": 66, "pursuer_max_accel": 67, "pursuer_spe": 67, "pursuit": [64, 70], "pursuit_v4": 66, "push": 54, "put": [10, 17], "py": [1, 10, 38, 70, 75, 78, 79, 80, 81, 90], "pybullet": 68, "pydocstyl": 70, "pygam": [38, 40, 41, 68, 70], "pyglet": 70, "pymunk": [40, 41, 70, 93], "pypi": 70, "pyproject": 70, "pyright": 70, "pytest": [1, 70, 90], "python": [1, 9, 43, 69, 70, 88, 94, 95, 96, 97], "python_vers": [71, 72, 73], "pytorch": [71, 72, 87, 91, 96], "pyyaml": [71, 72, 73], "pz": [12, 76], "q": [40, 48, 71, 87, 94, 97], "qmix": [3, 39, 65], "qol": 70, "quadrapong": [13, 70], "quadrapong_v4": 29, "qualiti": [65, 70, 77, 96], "queen": [43, 48], "queensid": 43, "question": [70, 71, 72, 73, 75, 76, 85, 86, 87, 89, 90, 92, 93, 94, 95, 97], "quickli": [19, 20, 21, 25], "quot": 70, "r": [1, 8, 10, 71, 72, 73, 75, 86], "race": [2, 19, 26, 68], "radiu": 67, "raffaelegalliera": 70, "rai": [70, 87, 89], "rainbow": 71, "rais": [6, 10, 41, 48, 50, 51, 79, 80], "ram": 13, "rand_se": [71, 72, 73], "randint": [79, 80], "random": [2, 4, 8, 11, 12, 13, 38, 39, 41, 42, 47, 54, 64, 67, 70, 71, 74, 75, 76, 79, 80, 86, 90, 92, 93, 94, 95, 96, 97], "random_act": 86, "random_demo": 70, "random_drop": [41, 89], "random_oppon": 71, "random_rot": [41, 89], "random_start_play": 47, "randomli": [8, 26, 54, 57, 66, 71, 79], "randompolici": [94, 95, 97], "rang": [8, 10, 12, 41, 47, 67, 71, 72, 73, 75, 76, 90, 92, 93, 94, 97], "rank": [43, 45, 47], "rapid": 23, "rare": [19, 20], "rate": [40, 71, 72, 73, 75, 94], "rather": [2, 8, 9, 70, 92, 93], "ratio": [12, 41, 70, 75, 76], "raw": [70, 90], "raw_env": [9, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67], "ray_result": [87, 89], "rb_action": [12, 76], "rb_advantag": [12, 76], "rb_logprob": [12, 76], "rb_ob": [12, 76], "rb_return": [12, 76], "rb_reward": [12, 76], "rb_term": [12, 76], "rb_valu": [12, 76], "re": [13, 70, 90], "reach": [4, 12, 40, 44, 68, 70, 76], "reaction": 8, "read": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70], "readabl": 70, "readi": [71, 72, 73, 78], "readm": [70, 78], "readthedoc": [90, 92, 93], "real": [41, 68, 86], "realist": 41, "reappli": 8, "reason": [9, 10, 11, 54, 71, 90], "rebuild": 1, "recast": 8, "receiv": [2, 3, 4, 9, 14, 20, 22, 26, 27, 28, 29, 30, 33, 35, 36, 39, 45, 47, 48, 49, 51, 52, 54, 62, 65, 66, 67, 86], "recent": [8, 10, 68, 70, 71], "reciproc": 7, "recommend": [8, 10, 13, 71, 72, 73, 75, 76, 81, 83, 86, 87, 89, 90, 92, 93, 94, 95, 97], "reconstruct": [54, 57], "record": [72, 73, 75], "recordvideo": 75, "red": [47, 54, 56, 62, 66, 67], "redesign": [39, 70], "redid": 70, "redtachyon": 70, "reduc": [10, 70, 73, 79, 80, 92], "reduct": [5, 92], "ref": 70, "refactor": [41, 67, 70], "refer": [12, 45, 48, 51, 54, 65, 67, 69, 70, 71, 76, 85, 90], "reflect": 70, "regardless": 47, "regex": 86, "regexpars": 86, "reginald": 70, "region": [8, 40], "regist": [27, 34, 87], "register_custom_model": [87, 89], "register_env": [87, 89], "registri": [87, 89], "regress": 11, "regular": [51, 71], "reinforc": [2, 3, 5, 7, 8, 13, 42, 64, 68, 69, 71, 74, 77, 88, 91, 96], "reinit": [4, 71], "reiniti": 4, "rel": [12, 27, 40, 43, 54, 59, 61, 63, 65, 76, 81], "relat": [9, 40, 54, 70], "releas": [2, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 64, 65, 66, 67, 68], "relev": [10, 40], "reli": 90, "reliabl": [30, 70, 91], "relu": [12, 75, 76, 89], "remain": [6, 39, 47, 71, 90], "remov": [2, 3, 8, 9, 10, 13, 40, 45, 47, 65, 66, 70, 71, 79, 80, 90, 92], "remove_on_fal": 65, "renam": 70, "render": [2, 3, 4, 6, 7, 9, 10, 12, 13, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70, 71, 72, 73, 76, 78, 79, 80, 87, 89, 90, 92, 93, 94, 95], "render_fp": 70, "render_mod": [2, 3, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 76, 86, 89, 90, 92, 93, 94, 95], "render_result": 11, "render_test": [11, 70], "repeat": [12, 27, 47, 76, 85], "repeat_action_prob": [8, 13], "repeatedli": 71, "repetit": [43, 70], "repl": 86, "replac": [13, 43, 44, 45, 46, 47, 48, 50, 51, 52, 65, 70, 86], "replai": [71, 72, 73], "replay_buff": 71, "replaybuff": 71, "repo": [70, 74, 86], "report": [67, 70], "repositori": [75, 79], "repres": [2, 8, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 65, 67, 69, 71], "represen": 70, "reproduc": [11, 86], "request": 8, "requir": [1, 2, 8, 9, 10, 11, 20, 25, 38, 49, 66, 70, 71, 78, 79, 80, 87, 89, 90, 92, 94, 95, 97], "rescal": [55, 56, 57, 58, 59, 60, 61, 62, 63], "rese": 9, "research": [7, 8, 13, 42, 45, 48, 51, 54, 71, 77], "resembl": 2, "reset": [2, 3, 4, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 75, 76, 78, 79, 80, 86, 87, 89, 90, 92, 93], "reshap": [8, 71, 75], "reshape_v0": 8, "resiz": [71, 91, 92], "resize_fram": 71, "resize_v1": [8, 12, 13, 72, 75, 76, 89, 92], "resized_fram": 71, "resolut": [2, 68], "resolv": 70, "resourc": [2, 39, 40, 41, 43, 44, 46, 47, 49, 52, 65, 66, 67, 71, 87, 89], "respect": [38, 40, 43, 44, 45, 46, 48, 59, 67, 70], "respond": 86, "respons": 15, "rest": 65, "restrict": [2, 3, 13], "result": [2, 8, 10, 11, 40, 54, 64, 67, 70, 71, 75, 90, 92, 94, 95, 97], "resum": 94, "resume_path": 94, "resurect": 70, "ret": 86, "retreiv": 70, "retri": 86, "retriev": [8, 9, 90], "retry_if_exception_typ": 86, "retry_st": 86, "retryerror": 86, "return": [2, 3, 4, 6, 8, 9, 10, 11, 12, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 62, 65, 66, 67, 70, 71, 72, 73, 74, 75, 76, 78, 79, 80, 86, 87, 89, 90, 92, 93, 94, 97], "return_info": 70, "return_length": 71, "reusabl": [5, 6, 10], "reveal": [47, 48, 49], "revers": [2, 12, 75, 76], "revisit": [8, 13], "rew": [86, 94, 97], "reward": [2, 3, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 69, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93, 94], "reward_list": [72, 73], "reward_map": 10, "reward_metr": [94, 97], "reward_sum": [87, 89], "rewrit": [40, 70], "rgb": [13, 41, 70], "rgb_arrai": [2, 3, 9, 11, 12, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 65, 66, 67, 70, 71, 72, 73, 76, 89], "rgb_imag": 13, "richard": 71, "right": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 42, 43, 54, 65, 66, 71, 79, 80], "right_paddle_spe": [9, 39], "rightmost": [41, 65], "ring": 15, "riot": 68, "rl": [2, 9, 43, 44, 45, 46, 47, 48, 50, 51, 52, 70, 71, 72, 73, 75, 77, 90, 91, 96], "rl_hp": [71, 72, 73], "rl_hp_select": [71, 72, 73], "rlcard": [42, 45, 48, 50, 51, 70], "rlcard_env": [45, 48, 50, 51], "rllib": [3, 68, 70], "rllib_leduc_holdem": 87, "rllib_num_gpu": [87, 89], "rnd": 70, "robber": 26, "robot": [7, 65], "robust": 70, "rock": [2, 3, 10, 70, 88, 90, 95], "rock_paper_scissor": 86, "rohan": [87, 89], "rohan138": [87, 89], "role": 68, "rollout": [75, 87, 89], "rollout_fragment_length": [87, 89], "rollov": [12, 76], "rom": [13, 70, 75], "rom_path": [13, 75], "rook": 43, "room": [2, 32], "root": [2, 81], "rotat": [40, 65], "round": [48, 50, 51, 70, 90], "round_reward": 90, "row": [8, 27, 40, 43, 45, 46, 71], "row_count": 71, "rp": [42, 49, 70], "rps_v2": [2, 10, 49, 86, 95], "rstrip": 75, "rule": [27, 43, 71, 86], "rummi": [42, 70], "run": [1, 2, 3, 4, 11, 12, 17, 25, 32, 62, 67, 70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "run_nam": 75, "ruzh": 42, "ryan": 54, "sabotag": 30, "safe_load": 71, "samaritan": 68, "same": [3, 8, 11, 18, 29, 39, 40, 41, 43, 44, 45, 46, 47, 49, 52, 65, 66, 67, 70, 71, 74, 81, 86, 90, 93], "sampl": [2, 3, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 71, 72, 73, 75, 76, 86, 90, 92], "sane": 10, "satisfi": 47, "save": [12, 46, 71, 72, 73, 76, 89, 90, 92, 93, 94, 97], "save2memori": [72, 73], "save2memoryvectenv": 71, "save_al": 89, "save_best_fn": [94, 97], "save_cod": 75, "save_dir": 4, "save_ob": 70, "save_observ": 4, "save_path": [71, 72, 73], "savecheckpoint": [71, 72, 73], "say_0": [57, 59, 60, 63], "say_1": [57, 59, 60, 63], "say_2": [57, 59, 60, 63], "say_3": [57, 59, 60, 63], "say_4": [59, 60], "say_5": [59, 60], "say_6": [59, 60], "say_7": [59, 60], "say_8": [59, 60], "say_9": [59, 60], "sb3": [70, 91], "sb3_connect_four_action_mask": 90, "sb3_contrib": 90, "sb3actionmaskwrapp": 90, "scalabl": 68, "scalar": [47, 49], "scale": [8, 41, 54, 65, 67, 88], "scale_actions_v0": 8, "scenario": [7, 38, 68], "scenariorunn": 68, "scene": 54, "scenic": 68, "schema": 86, "scheme": [6, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 70], "scipi": 70, "scissor": [2, 3, 10, 70, 88, 90, 95], "scope": 78, "score": [13, 14, 15, 16, 17, 18, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 33, 35, 37, 45, 47, 71, 72, 73, 90], "scratch": [77, 83], "screen": [13, 20, 30, 32, 39, 40, 41, 55, 56, 57, 58, 59, 60, 61, 62, 63, 67, 70], "screen_height": [43, 45, 46, 48, 49, 50, 51, 52], "screen_scal": 44, "script": [1, 70, 75, 90, 92, 93, 96], "sdl_videodriv": [87, 89], "se": 43, "search": [21, 71, 72], "second": [2, 9, 11, 14, 18, 22, 27, 28, 29, 33, 34, 35, 43, 46, 52, 54, 66, 71, 73, 90, 91, 92, 95], "second_0": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37], "secondari": 3, "section": [20, 43, 44, 45, 46, 47, 48, 50, 51, 52, 66, 70, 71], "secur": [68, 70], "see": [2, 3, 4, 7, 8, 10, 13, 19, 20, 38, 47, 54, 55, 56, 63, 70, 71, 75, 77, 83, 85, 87, 88, 89, 90, 91, 92, 93], "seed": [2, 3, 4, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 69, 70, 75, 76, 78, 79, 80, 90, 92, 93, 94, 97], "seed_test": [11, 70], "seem": 90, "seen": [43, 63], "seer": 47, "select": [2, 4, 9, 10, 12, 18, 34, 41, 66, 70, 71, 72, 73, 76, 85, 86], "self": [2, 10, 12, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 68, 70, 74, 75, 76, 78, 79, 80, 86, 87, 89, 90], "self_in_forest": 63, "self_po": [61, 62, 63], "self_vel": [55, 58, 59, 60, 61, 62, 63], "sens": [8, 67], "sensor": [65, 67], "sensor_rang": 67, "sent": [21, 57], "separ": [9, 11, 71, 81, 90], "seq_len": [87, 89], "sequenc": [2, 13, 40, 44, 45, 85], "sequence_spac": 40, "sequenti": [2, 12, 46, 69, 70, 75, 76, 89], "serial": [47, 70], "serv": [14, 22, 28, 29, 33, 35, 70, 71], "server": [70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "set": [5, 6, 8, 9, 10, 11, 13, 17, 26, 38, 40, 41, 42, 43, 44, 45, 47, 50, 51, 54, 63, 64, 65, 67, 70, 71, 73, 79, 80, 86, 92, 93], "set_ep": [94, 97], "set_postfix_str": 71, "set_random_se": 90, "setup": [12, 70, 78], "seventh": 43, "sever": [40, 54], "sgd_minibatch_s": 89, "shahofblah": 70, "shape": [8, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 71, 72, 73, 75, 76, 87, 94, 97], "share": [8, 30, 66, 88, 91], "shared_reward": [65, 66], "shelf": 91, "shield": 30, "shift": 30, "shimmi": [2, 5, 47, 68, 70], "shimmy2022github": 7, "ship": 30, "shoot": 40, "short": 78, "shorter": 74, "shot": 18, "should": [2, 4, 6, 9, 10, 11, 18, 39, 40, 41, 43, 44, 46, 47, 49, 52, 65, 66, 67, 71, 72, 73, 75, 76, 78, 79, 80, 86, 87, 89, 90, 92, 93, 94, 95, 97], "show": [2, 12, 47, 49, 52, 71, 72, 73, 75, 76, 77, 87, 88, 89, 90, 91, 92, 93, 95, 97], "shown": [6, 51, 66, 71, 72, 73, 74, 75, 76, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "shuffl": [12, 75, 76], "side": [14, 20, 22, 27], "signal": [54, 57, 65, 70], "signifi": 43, "signific": [8, 47, 70, 71], "significantli": [70, 74, 92, 93], "similar": [2, 3, 5, 6, 9, 10, 31, 43, 46, 51, 60, 63, 69], "similarli": [52, 67], "simpl": [2, 3, 5, 6, 8, 9, 10, 39, 41, 47, 52, 54, 69, 73, 74, 77, 86, 88, 91, 95], "simple_adversari": 56, "simple_adversary_v3": [55, 56, 70], "simple_crypto": 57, "simple_crypto_v3": 57, "simple_env": 70, "simple_push": 58, "simple_push_v3": 58, "simple_refer": [59, 60, 70], "simple_reference_v3": 59, "simple_speaker_listen": 60, "simple_speaker_listener_v4": [60, 73], "simple_spread": [61, 70], "simple_spread_v3": 61, "simple_tag": [62, 63], "simple_tag_v3": [54, 62], "simple_v3": 55, "simple_world_comm": 63, "simple_world_comm_v3": 63, "simpleenv": 70, "simpler": [2, 43, 83, 90], "simplest": 4, "simpli": [11, 49, 70, 71, 86], "simplic": 81, "simplifi": [8, 68], "simul": [65, 67, 68, 86], "simultan": [2, 3, 49, 59, 69, 78], "sinc": [8, 9, 25, 49, 54], "singl": [2, 8, 9, 11, 20, 43, 47, 55, 65, 66, 68, 70, 71, 77, 85, 90, 91, 92, 93], "single_act": 87, "single_action_spac": 75, "single_observation_spac": 75, "singular": 70, "sisl": [6, 65, 66, 67, 70, 93], "site": 70, "situat": 7, "six": [48, 70, 85], "size": [8, 40, 46, 47, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 66, 67, 70, 71, 72, 73, 94, 97], "skill": 71, "skip": [8, 13, 86, 90], "skyjo": 68, "slightli": [45, 71], "slope": 71, "slow": 70, "slower": 62, "slowli": [32, 71], "small": [9, 39, 43, 47, 63, 65, 70, 71], "smaller": [71, 90, 94], "smoother": 70, "so": [6, 8, 9, 10, 11, 13, 27, 29, 30, 32, 35, 41, 43, 47, 52, 54, 62, 68, 70, 71, 75, 79, 80, 86, 90, 92, 93], "social": 7, "soft": [71, 72, 73], "softwar": [7, 96], "sole": 42, "solv": [27, 71], "solvabl": 90, "some": [2, 3, 5, 9, 10, 11, 13, 14, 16, 17, 22, 26, 28, 30, 35, 54, 70, 71, 80, 85, 86], "somehow": 30, "someth": [40, 87, 89], "sometim": [13, 51, 54, 71], "songyi": 42, "soon": 40, "sophist": 71, "sort": 8, "sound": 71, "sourc": [2, 3, 4, 6, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 68, 85, 88], "sp": 75, "space": [2, 3, 4, 6, 8, 9, 10, 13, 38, 39, 40, 41, 42, 55, 56, 57, 58, 59, 60, 61, 62, 63, 66, 68, 70, 71, 72, 73, 75, 79, 80, 87, 90, 91, 92, 93, 94, 97], "space_invad": [30, 72], "space_invaders_v2": [8, 13, 30, 72], "space_war": 31, "space_war_v2": 31, "spade": [45, 50, 51], "spawn": [4, 40, 41, 66, 91, 92], "spawn_rat": 40, "speak": 60, "speaker": [54, 59, 73, 74], "speaker_0": 60, "speaker_listen": 73, "special": 9, "specif": [2, 3, 8, 14, 16, 17, 22, 26, 28, 29, 30, 35, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 61, 65, 66, 67, 68, 70, 71, 72, 73, 75, 85], "specifi": [2, 4, 8, 9, 10, 13, 38, 39, 40, 41, 43, 44, 45, 46, 48, 49, 50, 51, 52, 54, 65, 66, 67, 71, 72, 73, 75, 79, 80], "speed": [16, 39, 65, 67, 92, 93, 96], "speed_featur": 67, "speedup": 70, "sphinx": [1, 70], "split": 56, "spock": [49, 70], "spot": 43, "spread": 54, "springer": 64, "sprite": 13, "sqrt": [12, 75, 76], "squar": [21, 40, 43, 70], "squeez": [72, 73], "ss": [72, 75, 89, 92, 93], "ssd": 68, "stab": 40, "stabil": [71, 72], "stabl": [70, 90, 92, 93], "stable_baselines3": [90, 92, 93], "stack": [5, 8, 12, 43, 46, 76, 91, 92], "stack_siz": [12, 76], "stag": 68, "stage": [2, 18, 20, 71], "stai": [39, 41, 66, 92], "stall": [14, 18, 22, 27, 28, 29, 33, 34, 35, 70], "stand": [36, 44], "standalon": 70, "standard": [2, 3, 4, 8, 11, 13, 46, 47, 49, 51, 69, 70, 85, 96], "stanford": 64, "start": [2, 8, 10, 21, 30, 39, 40, 41, 43, 44, 46, 47, 49, 52, 54, 65, 66, 67, 70, 71, 72, 73, 75, 76, 79, 80, 83, 90, 92, 93], "start_dim": [12, 76], "start_tim": 75, "state": [2, 3, 4, 6, 9, 10, 39, 40, 41, 43, 44, 46, 47, 49, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70, 71, 72, 73, 79, 80, 85, 87, 89, 91], "state_dict": [71, 94, 97], "state_dim": [71, 72, 73], "state_out": 87, "state_shap": [94, 97], "state_spac": [9, 70], "static": [2, 4, 54, 70], "stationari": 71, "std": [12, 75, 76], "steal": 25, "step": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 75, 76, 78, 79, 80, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "step_per_collect": [94, 97], "step_per_epoch": [94, 97], "stick": 8, "sticki": [8, 27], "sticky_act": 13, "sticky_actions_v0": [8, 13], "still": [10, 26, 40, 41, 49, 71], "stochast": [2, 3], "stone": 46, "stop": [4, 71, 72, 73, 86, 87, 89], "stop_after_attempt": 86, "stop_fn": [94, 97], "storag": [12, 75, 76], "store": [2, 9, 10, 47, 71, 78], "store_tru": 94, "str": [2, 3, 4, 10, 11, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 66, 70, 71, 75, 90, 92, 93, 94], "straight": 40, "strategi": [18, 27, 30, 32, 34, 52, 71], "streamlin": [70, 74], "strength": [71, 72, 73], "strftime": [71, 90, 92, 93], "stride": [71, 72, 75, 89], "stride_s": [71, 72], "string": [2, 3, 4, 6, 8, 9, 10, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70], "strip": 90, "strong": 71, "strong_rule_based_oppon": 71, "strongli": 10, "strtobool": 75, "structur": [2, 9, 40, 65, 70, 79, 83, 86], "stubborn": 7, "stuck": [19, 20], "studi": [9, 13, 43], "style": [12, 34, 43, 46, 70, 71, 76], "sub": 91, "subclass": 86, "subprocess": [2, 10, 39, 40, 41, 43, 44, 46, 47, 49, 52, 65, 66, 67], "substanti": 70, "substrat": 7, "substrate_nam": 7, "succe": 22, "success": [15, 18, 54, 71], "successfulli": [1, 27, 44, 70, 71], "suffici": 8, "suggest": 70, "suit": [7, 45, 48, 81], "sum": [4, 14, 18, 22, 24, 25, 27, 28, 29, 33, 34, 35, 47, 54, 61, 71, 72, 73, 86, 90, 92, 93], "sum_of_reward": 86, "summar": 85, "summarywrit": [75, 94], "super": [12, 75, 76, 86, 90], "superior": [70, 73], "supersuit": [5, 10, 12, 13, 70, 71, 72, 73, 75, 76, 87, 88, 89, 91, 92, 93], "support": [2, 3, 4, 6, 8, 9, 10, 11, 13, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 68, 69, 70, 71, 75, 90, 91, 92], "suppress": 4, "suppress_output": 4, "sure": [11, 81], "surprisingli": 8, "surrog": 75, "surround": [13, 41, 46, 66], "surround_v2": 32, "surviv": 67, "sushant1212": 70, "sutton": 71, "svg": 11, "sw": 43, "swap": [52, 71, 72, 73], "swap_channel": [72, 73], "swing": 40, "switch": [2, 9, 23, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70], "sword": 40, "symmetr": 20, "sync_tensorboard": 75, "system": [4, 9, 10, 13, 24, 31, 43, 46, 54, 64, 71], "systemmessag": 86, "t": [8, 9, 10, 12, 30, 33, 47, 56, 62, 70, 75, 76, 90], "tabl": [26, 49, 65, 67], "tac": [70, 94, 97], "tag": [54, 66, 70], "tag_reward": 66, "tai": 7, "take": [2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 18, 27, 34, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70, 71, 72, 73, 79, 80, 85, 86, 90, 91, 92, 93], "taken": [2, 9, 31, 47, 49, 71, 80], "taller": 8, "talli": 27, "talviti": 13, "tamar": 54, "tank": 13, "target": [47, 56, 59, 67, 71, 72, 73, 75, 94], "target_kl": 75, "target_update_freq": [94, 97], "task": [71, 77], "tau": [71, 72, 73], "td": 71, "teach": 71, "team": [7, 18, 22, 29, 35, 54, 57, 75], "team_siz": 7, "teammat": 20, "technic": 70, "techniqu": [71, 74], "teleport": 39, "tell": [8, 10, 11, 47, 86, 91], "temperatur": 86, "temporarili": [54, 70], "tenac": 86, "tenni": 13, "tennis_v3": 33, "tensor": [12, 75, 76, 87], "tensorboard": [70, 75, 76, 77, 94], "tensorboardlogg": 94, "tensorflow": [87, 89], "term": [12, 27, 43, 76, 86], "term_pursuit": 66, "termin": [2, 3, 4, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93], "terminate_on_fal": 65, "terminate_reward": 65, "terminateilleg": 70, "terminateillegalwrapp": [6, 7], "termini": 86, "terrain": 65, "terrain_length": 65, "terri": [7, 8, 13], "territori": 46, "terry2020arcad": 13, "test": [4, 7, 10, 70, 71, 72, 73, 75, 76, 78, 83, 92, 94, 96], "test_action_flex": 70, "test_action_mask_easi": 90, "test_action_mask_hard": 90, "test_action_mask_medium": 90, "test_collector": [94, 97], "test_env": [87, 94, 97], "test_fn": [94, 97], "test_in_train": [94, 97], "test_kept_st": 11, "test_num": 94, "test_save_ob": 11, "texa": [42, 48, 70, 90], "texas_holdem": 50, "texas_holdem_no_limit": [51, 86], "texas_holdem_no_limit_v6": [51, 86, 90], "texas_holdem_v4": [50, 90], "text": [2, 70, 71, 72, 73, 85, 86], "text_color": [71, 72, 73], "th": [43, 94], "than": [8, 46, 49, 51, 70, 71, 80, 90, 92, 93], "thank": 70, "thei": [9, 10, 11, 12, 14, 15, 17, 20, 26, 27, 28, 30, 33, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 57, 61, 62, 65, 66, 67, 70, 71, 76], "them": [6, 9, 11, 24, 25, 27, 30, 34, 41, 42, 54, 56, 65, 70, 71, 85, 92], "theme": 70, "themikeste1": 70, "themselv": 85, "theoret": [13, 68], "theori": [2, 68], "therefor": [49, 67, 71], "thermomet": 47, "thi": [1, 2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "thing": 70, "think": [27, 71, 78, 79], "third": [46, 66, 70], "third_0": [22, 29, 35, 36], "third_party_env": 70, "thorough": 96, "those": [45, 47, 64, 71], "though": [9, 10, 54, 83], "thought": [2, 70], "three": [13, 43, 51, 64, 70, 71], "three_in_row": 71, "three_in_row_count": 71, "threshold": 75, "through": [2, 3, 6, 9, 10, 11, 17, 19, 20, 21, 26, 70, 71, 72, 73, 74, 78, 85], "throw": [47, 70], "thrust": 67, "thrust_penalti": 67, "thu": [9, 41, 58, 94, 95, 97], "ti": 90, "tianshou": 70, "tic": [70, 94, 97], "tic_tac_to": [86, 94], "tictacto": [42, 52, 70], "tictactoe_v3": [6, 52, 86, 90, 94, 97], "tie": [2, 90], "tier": 39, "tiger_d": 70, "tight": 77, "time": [1, 2, 4, 6, 8, 9, 10, 14, 16, 18, 22, 23, 24, 26, 27, 28, 29, 30, 33, 34, 35, 37, 39, 40, 41, 42, 44, 48, 49, 51, 63, 65, 66, 67, 68, 70, 71, 74, 75, 79, 80, 86, 90, 92, 93], "time_penalti": [41, 89], "timelin": 53, "timer": [14, 18, 22, 27, 28, 29, 33, 34, 35, 70], "timestamp": [79, 80], "timestep": [6, 39, 65, 75, 77, 79, 80, 87, 90], "timesteps_tot": [87, 89], "titl": [7, 8, 13, 42, 54, 64], "to_dict": [87, 89], "to_parallel": 70, "tobirohr": 70, "todo": [75, 87, 90], "toe": [70, 94, 97], "togeth": [30, 47, 54, 67], "toggl": [66, 67, 75], "token": [27, 44, 47], "tolist": 71, "toml": 70, "too": 71, "took": [47, 70], "tool": [13, 69, 85], "toolkit": 42, "top": [1, 30, 40, 45, 46, 65, 66, 71, 79], "torch": [12, 71, 72, 73, 75, 76, 87, 89, 94, 97], "torch_determinist": 75, "torch_modelv2": 89, "torch_util": 87, "torchfc": 87, "torchmaskedact": 87, "torchmodelv2": 89, "toreset": 70, "total": [20, 39, 40, 46, 47, 59, 63, 65, 70, 71, 72, 73, 75, 90], "total_episod": [12, 71, 76], "total_episodic_return": [12, 76], "total_reward": 90, "total_step": 71, "total_timestep": [75, 90, 92, 93], "touch": [40, 66, 67], "tournament": [46, 71, 72, 73], "tournament_s": [71, 72, 73], "tournamentselect": [71, 72, 73], "toward": [10, 29, 35, 36, 41, 43, 65], "tower": 7, "tqdm": [71, 72, 73], "track": [16, 47, 71, 75, 77, 78, 90, 91], "tracker": 71, "tradit": [22, 74, 85], "traffic": 68, "trail": 32, "train": [3, 4, 12, 39, 43, 65, 68, 70, 74, 75, 76, 77, 91, 94, 95, 96], "train_action_mask": 90, "train_actions_dict": 71, "train_actions_hist": 71, "train_ag": 94, "train_batch_s": [87, 89], "train_butterfly_supersuit": 93, "train_collector": [94, 97], "train_env": [94, 97], "train_fn": [94, 97], "trainer": [94, 97], "training_num": [94, 97], "trang": [71, 72, 73], "transform": [5, 8, 10, 46], "transient": 70, "transit": [9, 12, 71, 76], "transmit": 54, "transpos": [12, 76], "trap": 27, "travel": 21, "travers": 26, "treat": [8, 9, 71], "tree": 2, "tri": [10, 11], "trigger": 8, "troubleshoot": 70, "true": [4, 8, 9, 13, 16, 17, 30, 39, 40, 41, 45, 47, 54, 65, 66, 67, 70, 71, 72, 73, 75, 79, 80, 86, 89, 90, 92, 93, 94, 97], "truetyp": 71, "trunc": [12, 76, 86], "truncat": [2, 3, 4, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 72, 73, 75, 76, 79, 80, 86, 87, 89, 90, 92, 93], "trust": 7, "try": [2, 3, 14, 29, 30, 32, 35, 57, 67, 71, 72, 73, 75, 79, 86, 90, 92, 93], "try_import_torch": 87, "ttf": 71, "ttt": 97, "tunabl": 68, "tune": [77, 87, 89, 90], "tupl": [2, 3, 8, 94, 97], "turn": [2, 4, 6, 8, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 67, 69, 70, 71, 87], "turns_per_episod": 71, "tut": 70, "tutori": [2, 3, 10, 68, 70, 71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "tutorial2_adding_game_log": 81, "tutorial3_action_mask": 81, "tv": 8, "twin": 73, "two": [3, 8, 11, 13, 15, 18, 22, 23, 25, 28, 29, 30, 39, 40, 41, 43, 45, 46, 49, 51, 65, 67, 70, 71, 79, 90, 91, 95], "txt": [1, 78], "type": [2, 3, 6, 8, 10, 11, 40, 43, 47, 70, 71, 75, 85, 87, 90, 94, 96, 97], "type_onli": [8, 75], "typemask": 40, "typevar": 70, "typic": [2, 3, 9, 10, 54, 67], "typo": 70, "t\u014drere": 68, "u": [1, 40, 71], "ui": 68, "uint8": 8, "ultim": 71, "umutucak": 70, "unari": 47, "unbatchifi": [12, 76], "unchang": 39, "uncom": 71, "under": [65, 70], "underli": [2, 6, 9, 70], "underneath": 9, "underpromot": 43, "understand": [10, 71, 72, 73, 75, 76, 78, 79, 86, 87, 89, 90, 92, 93, 94, 95, 97], "undertak": 71, "unexpect": 70, "unfamiliar": 7, "unforgiv": 24, "uniformli": 54, "unintent": 70, "union": 51, "uniqu": [13, 38, 42, 54, 64], "unit": [40, 41, 54, 66, 71], "uniti": 68, "unknown": 45, "unless": [17, 26, 90, 92], "unlik": [33, 43, 71], "unlimit": 71, "unmaintain": 70, "unnecessari": 70, "unpredict": 40, "unscal": 56, "unsuit": 4, "unsuppress_output": 4, "unsur": [2, 3], "until": [4, 10, 13, 44, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 71, 85], "unwrap": [70, 86, 90, 92, 93], "up": [8, 9, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 41, 43, 45, 54, 56, 66, 70, 71, 74, 79, 80, 92, 93], "upcom": 70, "updat": [2, 3, 6, 8, 10, 70, 71, 72, 73, 75, 79, 80, 90, 94], "update_epoch": 75, "update_per_step": [94, 97], "update_top": 71, "upgrad": [45, 48, 50, 51, 70], "upleft": [15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 31, 33, 37], "upper_bound": [8, 72, 75], "upright": [15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 31, 33, 37], "upstream": 70, "urgency_reward": 66, "url": 7, "us": [2, 3, 4, 6, 7, 8, 9, 11, 12, 13, 19, 20, 21, 38, 39, 40, 41, 42, 43, 45, 46, 47, 48, 51, 54, 57, 64, 67, 69, 70, 75, 76, 78, 79, 80, 81, 84, 85, 86, 87, 89, 90, 91, 92, 93, 94, 95, 97], "usabl": 70, "usag": [4, 11, 70, 96], "use_ga": 89, "use_typemask": 40, "user": [2, 10, 11, 12, 38, 74, 76, 77], "usual": [43, 44, 45, 46, 47, 48, 50, 51, 52, 78], "util": [2, 3, 5, 7, 9, 11, 69, 70, 71, 72, 73, 75, 85, 87, 90, 91, 94, 97], "uuid": 47, "v": [67, 71, 87, 89, 90, 92, 93, 97], "v0": [10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67], "v1": [10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67, 70, 79, 80, 91], "v10": [10, 40], "v2": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 67], "v3": [14, 18, 19, 20, 22, 24, 25, 26, 27, 28, 29, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 50, 51, 52, 65, 66, 67], "v4": [29, 34, 39, 40, 41, 43, 45, 46, 47, 48, 50, 51, 65, 66, 67], "v5": [39, 40, 41, 43, 46, 47, 51, 65, 70], "v6": [40, 41, 43, 51, 65, 70], "v7": [40, 65], "v8": [40, 65], "v9": 40, "v_clip": [12, 75, 76], "v_loss": [12, 75, 76], "v_loss_clip": [12, 75, 76], "v_loss_max": [12, 75, 76], "v_loss_unclip": [12, 75, 76], "v_max": 71, "v_min": 71, "vacuou": 9, "valid": [2, 5, 6, 10, 27, 86], "valid_action_instruct": 86, "valid_posit": 71, "valu": [3, 4, 6, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 70, 71, 72, 73, 75, 76, 79, 90, 92, 93], "value_fn": 89, "value_funct": [87, 89], "value_loss": 75, "valueerror": [86, 90, 92, 93], "var": [4, 12, 75, 76], "var_i": [12, 75, 76], "vareiti": 10, "vari": [43, 70, 90, 92, 93], "variabl": [2, 4, 10, 40, 70], "variable_env_test": 2, "varianc": [8, 12, 76], "variat": [13, 48, 51], "varieti": [24, 69, 71], "variou": [7, 13, 65, 66, 67, 70], "ve": 64, "vector": [8, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 54, 65, 67, 70, 91, 92, 93, 95], "vector_st": [40, 92], "vectoris": 95, "vectoriz": 40, "vectorreplaybuff": [94, 97], "vehicl": 68, "veloc": [54, 65, 67, 70], "veness": 13, "verbos": [90, 92, 93], "verbose_progress": 11, "veri": [9, 27, 38, 47, 68, 74, 78], "versa": 54, "version": [4, 7, 10, 11, 13, 67, 70, 71, 78, 87, 94, 95, 97], "vertic": [41, 44, 52, 67, 71], "vertical_thrust": 67, "vertical_win": 71, "vf": 75, "vf_coef": [12, 75, 76], "vf_loss_coeff": 89, "via": [3, 8, 9, 10, 13, 38, 42, 54, 64, 65, 68, 70, 78, 97], "vice": 54, "video": [13, 14, 22, 28, 29, 35, 68, 70, 71, 72, 73, 75, 77], "video_check": 34, "video_checkers_v4": 34, "view": [3, 39, 47, 65, 75, 77, 87, 89, 96], "virtual": [71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "visibilty_level": 26, "visibl": [26, 54], "visit": 70, "visual": [11, 38, 41, 70, 91, 92], "visual_observ": 92, "visualis": [71, 72, 73], "vloss": 75, "volleybal": 13, "volleyball_pong": [35, 70], "volleyball_pong_v2": 35, "volleyball_pong_v3": 35, "volum": 13, "vulner": 43, "vwxyzjn": 75, "w": [39, 40, 41, 43, 71, 72, 73], "wa": [2, 4, 8, 10, 12, 13, 20, 41, 47, 64, 68, 70, 76, 80, 86], "wafer": 25, "wai": [2, 8, 13, 25, 62, 71, 80, 85], "wait": [71, 86], "wait_non": 86, "walk": [10, 40, 83], "walker": 65, "walker_0": 65, "walker_1": 65, "walker_2": 65, "walkthrough": 10, "wall": [17, 20, 26, 32, 41, 66, 80], "wandb": [70, 71, 72, 73, 75], "wandb_dict": 71, "wandb_ent": 75, "wandb_project_nam": 75, "wander": 54, "want": [6, 8, 9, 12, 59, 76], "war": 13, "warlord": [13, 37], "warlords_v3": 36, "warm": 71, "warm_up_oppon": 71, "warmup": 71, "warn": [4, 6, 8, 10, 11, 70, 79, 80, 86], "warn_action_out_of_bound": 4, "warn_on_illegal_mov": 4, "warn_step_after_terminated_trunc": 4, "warp": 71, "wasd": 38, "watch": [90, 92, 93, 94], "waterworld": [64, 70, 88, 91], "waterworld_v4": [64, 67, 70, 93], "wave": 24, "wb": 71, "wd": 70, "we": [2, 3, 6, 9, 10, 11, 12, 13, 43, 64, 70, 71, 76, 78, 79, 80, 81, 86, 90, 91, 92, 93], "weak": 71, "weak_rule_based_oppon": 71, "webassembli": 68, "webgl": 68, "websit": [2, 3, 70], "wed": 39, "wei": 42, "weight": [12, 41, 59, 61, 75, 76, 77], "weird": 9, "welcom": [70, 78], "well": [24, 37, 40, 47, 49, 65, 70, 90], "were": [13, 39, 40, 46, 47, 54, 70, 71], "what": [8, 11, 12, 40, 43, 47, 70, 74, 76, 90], "whatev": 90, "when": [4, 6, 8, 9, 10, 11, 12, 13, 16, 17, 20, 23, 24, 26, 27, 30, 31, 33, 36, 37, 39, 40, 44, 47, 54, 63, 65, 66, 67, 70, 71, 73, 74, 76, 90], "whenev": [2, 4, 15, 16, 17, 19, 31], "where": [1, 2, 3, 4, 6, 7, 8, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 78, 79, 86, 91], "wherea": 2, "whether": [16, 40, 43, 44, 45, 46, 47, 48, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 71, 75, 85], "which": [2, 3, 4, 5, 6, 8, 10, 11, 12, 13, 15, 18, 27, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 56, 57, 59, 65, 66, 67, 70, 71, 76, 80, 85, 86, 87, 90, 92, 95], "while": [3, 4, 6, 7, 8, 9, 10, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 46, 49, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 69, 71, 76, 90], "white": [43, 46, 47, 66, 70], "white_0": 46, "who": [45, 70, 71], "whole": 40, "whose": [43, 44, 45, 46, 47, 48, 50, 51, 52, 67], "why": 4, "wide": [10, 40, 68, 69], "width": [12, 40, 71, 76], "willdudlei": [70, 94, 95, 97], "win": [26, 27, 34, 42, 48, 49, 71, 94], "win_rat": [71, 94], "window": [2, 3, 9, 10, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 65, 66, 67, 70], "winnabl": 71, "winner": [43, 45, 46, 48, 49, 50, 51, 52, 90], "winning_act": 71, "winrat": 90, "wise": 13, "wish": [8, 10, 71, 87], "within": [6, 8, 9, 13, 14, 22, 28, 29, 33, 35, 39, 45, 47, 67, 78], "without": [9, 10, 20, 65, 70, 71, 72, 73, 75, 76, 79, 80, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "wizard": 13, "wizard_of_wor": [36, 37], "wizard_of_wor_v3": 37, "won": [9, 10, 33], "wor": 13, "word": 40, "work": [4, 8, 20, 25, 30, 45, 47, 48, 51, 54, 65, 67, 70, 81, 85, 90, 91], "workflow": 70, "world": [24, 40, 54, 66, 71], "worri": 71, "worth": [30, 71], "would": [2, 3, 6, 7, 8, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 70, 71, 78], "wrap": [6, 7, 9, 10, 45, 48, 51, 70, 90, 95], "wrapped_env": 10, "wrapper": [2, 3, 4, 9, 13, 46, 68, 70, 71, 75, 87, 89, 90, 92], "writer": [75, 94], "written": [70, 96], "wrong": 43, "wu": 54, "www": 70, "x": [8, 12, 40, 41, 43, 46, 52, 59, 62, 63, 65, 66, 67, 75, 76, 79, 80, 86], "x11": 40, "x5": 40, "x_size": [8, 66, 72, 75, 89, 92], "xdist": 70, "xia": 42, "xixinzhang": 70, "y": [8, 13, 40, 43, 46, 65, 67, 71, 79, 80, 90, 92, 93], "y_pred": [12, 75, 76], "y_size": [8, 66, 72, 75, 89, 92], "y_true": [12, 75, 76], "yaml": 71, "yank": 70, "ye": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67], "year": [7, 8, 13, 42, 54, 64, 70], "yellow": 47, "yet": [8, 49], "yi": 54, "yield": [9, 90], "you": [1, 2, 3, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 75, 76, 78, 83, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 97], "younik": 70, "your": [2, 3, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 69, 71, 72, 73, 75, 78, 79, 80, 83, 86, 87, 89], "yourself": [19, 20, 26], "yuanpu": 42, "zealand": 68, "zero": [4, 8, 12, 14, 18, 22, 27, 28, 29, 33, 34, 35, 42, 43, 44, 45, 46, 47, 48, 50, 51, 52, 54, 57, 65, 70, 71, 75, 76, 80, 88, 90], "zero_grad": [12, 75, 76], "zeros_lik": [12, 71, 75, 76], "zha": 42, "zha2019rlcard": 42, "zigzaging_bomb": 30, "zip": [10, 90, 92, 93], "zombi": [2, 4, 19, 20, 38, 70, 91]}, "titles": ["404 - Page Not Found", "PettingZoo docs", "AEC API", "Parallel API", "Utils", "Wrappers", "PettingZoo Wrappers", "Shimmy Compatibility Wrappers", "Supersuit Wrappers", "Basic Usage", "Environment Creation", "Testing Environments", "Tutorials", "Atari", "Basketball Pong", "Boxing", "Combat: Plane", "Combat: Tank", "Double Dunk", "Emtombed: Competitive", "Emtombed: Cooperative", "Flag Capture", "Foozpong", "Ice Hockey", "Joust", "Mario Bros", "Maze Craze", "Othello", "Pong", "Quadrapong", "Space Invaders", "Space War", "Surround", "Tennis", "Video Checkers", "Volleyball Pong", "Warlords", "Wizard of Wor", "Butterfly", "Cooperative Pong", "Knights Archers Zombies (\u2018KAZ\u2019)", "Pistonball", "Classic", "Chess", "Connect Four", "Gin Rummy", "Go", "Hanabi", "Leduc Hold\u2019em", "Rock Paper Scissors", "Texas Hold\u2019em", "Texas Hold\u2019em No Limit", "Tic Tac Toe", "<no title>", "MPE", "Simple", "Simple Adversary", "Simple Crypto", "Simple Push", "Simple Reference", "Simple Speaker Listener", "Simple Spread", "Simple Tag", "Simple World Comm", "SISL", "Multiwalker", "Pursuit", "Waterworld", "Third-Party Environments", "<no title>", "Release Notes", "AgileRL: Implementing DQN - Curriculum Learning and Self-play", "AgileRL: Implementing MADDPG", "AgileRL: Implementing MATD3", "AgileRL Tutorial", "CleanRL: Advanced PPO", "CleanRL: Implementing PPO", "CleanRL Tutorial", "Tutorial: Repository Structure", "Tutorial: Environment Logic", "Tutorial: Action Masking", "Tutorial: Testing Your Environment", "<no title>", "Custom Environment Tutorial", "<no title>", "LangChain Tutorial", "LangChain: Creating LLM agents", "RLlib: DQN for Simple Poker", "Ray RLlib Tutorial", "RLlib: PPO for Pistonball", "SB3: Action Masked PPO for Connect Four", "Stable-Baselines3 Tutorial", "SB3: PPO for Knights-Archers-Zombies", "SB3: PPO for Waterworld", "Tianshou: CLI and Logging", "Tianshou: Basic API Usage", "Tianshou Tutorial", "Tianshou: Training Agents"], "titleterms": {"0": 70, "1": 70, "10": 70, "11": 70, "12": 70, "13": 70, "14": 70, "15": 70, "16": 70, "17": 70, "18": 70, "19": 70, "2": 70, "20": 70, "21": 70, "22": 70, "23": 70, "24": 70, "3": 70, "4": 70, "404": 0, "5": 70, "6": 70, "7": 70, "8": 70, "9": 70, "No": [51, 86], "Not": 0, "The": 0, "With": 9, "about": 2, "action": [2, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 67, 80, 86, 90], "addit": [9, 78], "advanc": [75, 78], "adversari": 56, "aec": [2, 6, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 68], "aecenv": 2, "agent": [4, 7, 8, 9, 10, 68, 71, 72, 73, 85, 86, 87, 89, 97], "agilerl": [71, 72, 73, 74], "ai": 68, "an": [1, 9], "api": [2, 3, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67, 68, 95], "archer": [40, 92], "architectur": [88, 96], "argument": [39, 40, 41, 45, 46, 47, 49, 50, 51, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67], "atari": 13, "attribut": 2, "augment": 85, "averag": 4, "base": 40, "baselin": 91, "baselines3": 91, "basic": [9, 95], "basketbal": 14, "battl": 68, "battlesnak": 68, "benchmark": 11, "bombermanai": 68, "box": 15, "breakout": 68, "bro": 25, "build": 1, "butterfli": 38, "can": [71, 72, 73], "captur": [4, 21], "carla": 68, "cathedr": 68, "chain": 85, "check": 9, "checker": 34, "chess": 43, "citat": [7, 8, 13, 54], "classic": [42, 90], "cleanrl": [75, 76, 77], "cli": 94, "clone": 68, "code": [71, 72, 73, 75, 76, 78, 79, 80, 81, 86, 87, 89, 90, 92, 93, 94, 95, 97], "cogment": 68, "combat": [16, 17], "comm": 63, "common": 13, "compat": 7, "competit": 19, "compon": 9, "concept": 54, "config": 71, "conflict_rez": 68, "connect": [44, 68, 71, 90], "control": [7, 39, 40, 66], "convers": 6, "cookingzoo": 68, "cooper": [20, 39], "could": 0, "craze": 26, "crazi": 68, "creat": 86, "creation": 10, "crypto": 57, "curriculum": 71, "custom": [10, 83], "cyber": 68, "cycl": 11, "data": 85, "death": 9, "deepmind": 7, "default": 40, "deprec": 10, "detail": 13, "develop": 10, "dilemma": 68, "doc": 1, "document": 1, "done": 9, "doubl": 18, "dqn": [71, 87], "drone": 68, "dsse": 68, "dunk": 18, "edit": 1, "em": [48, 50, 51], "emtomb": [19, 20], "entir": 9, "env": 68, "environ": [1, 7, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 47, 54, 68, 71, 72, 73, 75, 76, 79, 81, 83, 86, 87, 88, 89, 90, 92, 93, 94, 95, 97], "envlogg": 4, "evalu": [85, 90, 92, 93], "exampl": [2, 3, 10, 74, 77, 88, 96], "expand": 49, "fanorona": 68, "file": [71, 78], "flag": 21, "foozpong": 22, "found": 0, "four": [44, 68, 71, 90], "full": [71, 86], "function": 8, "galaga": 68, "game": [13, 49, 68], "gener": [71, 85], "gfootbal": 68, "gin": 45, "go": 46, "gobblet": 68, "ground": 68, "gym": 68, "gymnasium": [68, 86], "hanabi": 47, "hearth": 68, "histori": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66], "hockei": 23, "hold": [48, 50, 51], "holdem": 86, "i": [9, 71, 72, 73], "ic": 23, "idiom": 9, "imag": 40, "implement": [71, 72, 73, 76], "import": 71, "includ": 8, "initi": 9, "instal": [9, 13, 38, 42, 54, 64], "integr": 77, "interact": [9, 68], "introduct": [78, 79, 80, 81], "invad": 30, "joust": 24, "kaggl": 68, "kaz": 40, "kei": 54, "knight": [40, 92], "langchain": [85, 86], "latest": 68, "learn": 71, "leduc": 48, "legal": [43, 44, 45, 46, 47, 48, 50, 51, 52], "limit": [51, 86], "listen": 60, "llm": [85, 86], "log": 94, "logic": 79, "loop": [71, 86], "maddpg": [72, 73], "manual": [39, 40, 66], "mario": 25, "mask": [2, 43, 44, 45, 46, 47, 48, 50, 51, 52, 80, 86, 90], "mat": 68, "matd3": 73, "max": 11, "maze": 26, "melt": 7, "memori": 85, "method": 2, "minim": [14, 21, 22, 27, 28, 29, 30, 32, 34, 35, 36], "mmo": 68, "model": 71, "modul": 10, "mpe": 54, "mu": 68, "multi": [7, 8], "multipl": [72, 73], "multiwalk": 65, "muzero": 68, "neural": 68, "notabl": 9, "note": 70, "number": 9, "observ": [4, 11, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 65, 67], "older": 68, "onli": 8, "openspiel": 7, "oper": 68, "option": [9, 78], "othello": 27, "other": 90, "overview": [13, 74, 77, 85, 88, 91, 96], "page": [0, 1], "paper": [49, 86], "parallel": [3, 6, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 49, 55, 56, 57, 58, 59, 60, 61, 62, 63, 65, 66, 67], "parallelenv": 3, "paramet": [13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37], "parti": 68, "perform": 11, "pettingzoo": [1, 6, 68, 70, 74, 77, 86, 88, 90, 96], "pistonbal": [41, 89], "plai": [71, 72, 73, 87, 89], "plane": 16, "pogema": 68, "poker": 87, "pong": [14, 28, 35, 39], "pot": 7, "ppo": [75, 76, 89, 90, 92, 93], "preprocess": 13, "prompt": 85, "pursuit": 66, "push": 58, "pz": 68, "quadrapong": 29, "racecar": 68, "rai": 88, "raw": 9, "recommend": 12, "refer": 59, "releas": 70, "render": [11, 54], "repositori": 78, "request": 0, "research": 68, "reward": [4, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 67], "rl": [68, 87, 89], "rllib": [87, 88, 89], "rock": [49, 86], "rummi": 45, "save": [4, 11], "sb3": [90, 92, 93], "scissor": [49, 86], "search": 68, "seed": 11, "selector": [4, 10], "self": 71, "sequenti": 68, "setup": [71, 72, 73, 75, 76, 86, 87, 89, 90, 92, 93, 94, 95, 97], "shimmi": 7, "simpl": [55, 56, 57, 58, 59, 60, 61, 62, 63, 87], "sisl": 64, "skeleton": 78, "skyjo_rl": 68, "smac": 68, "smacv2": 68, "soccer": 7, "social": 68, "space": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 65, 67], "speaker": 60, "spread": 61, "stabl": 91, "start": 12, "stdout": 4, "stone": 68, "structur": 78, "sumo": 68, "supersuit": 8, "support": 7, "surround": 32, "swarm": 68, "tac": [52, 86], "tactic": 68, "tag": 62, "tank": 17, "teamfight": 68, "tenni": 33, "termin": 54, "test": [1, 11, 81, 90], "texa": [50, 51, 86], "third": 68, "tianshou": [94, 95, 96, 97], "tic": [52, 86], "toe": [52, 86], "torer": 68, "total": 4, "train": [71, 72, 73, 87, 88, 89, 90, 92, 93, 97], "tree": 78, "tutori": [12, 74, 77, 78, 79, 80, 81, 83, 85, 88, 91, 96], "type": 54, "unwrap": 9, "us": [5, 10, 68, 71, 72, 73, 74, 77, 88, 96], "usag": [2, 3, 7, 9, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 95], "util": [4, 6, 10], "variabl": 9, "vector": 40, "vers": 68, "version": [14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 65, 66, 68], "video": 34, "volleybal": 35, "wandb": 77, "war": 31, "warlord": 36, "watch": [71, 72, 73, 87, 89], "waterworld": [67, 93], "weight": 71, "what": [71, 72, 73], "wizard": 37, "wor": 37, "world": 63, "wrapper": [5, 6, 7, 8, 10], "your": 81, "zombi": [40, 92]}}) \ No newline at end of file