{"version":1,"pages":[{"id":"-LterKS9HS0n1lQWmjmR","title":"SLM Lab","pathname":"/slm-lab/v4.2.0","siteSpaceId":"sitesp_L00gt","description":"Modular Deep Reinforcement Learning framework in PyTorch."},{"id":"-LtetdjtNeY6_S0sV9dF","title":"Installation","pathname":"/slm-lab/v4.2.0/setup/installation","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🖥Setup"}]},{"id":"-LtevlBNdLmRiVu8Mu3G","title":"Quick Start","pathname":"/slm-lab/v4.2.0/setup/quick-start","siteSpaceId":"sitesp_L00gt","description":"To test the installation.","breadcrumbs":[{"label":"🖥Setup"}]},{"id":"-LthpAeI_RGeAE6rGuZS","title":"Lab Command","pathname":"/slm-lab/v4.2.0/using-slm-lab/slm-lab-command","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lu0GqNzEpmVBs5aqj46","title":"Lab Organization","pathname":"/slm-lab/v4.2.0/using-slm-lab/lab-organization","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lu0dA__Nq1nB894SsWV","title":"Train: REINFORCE CartPole","pathname":"/slm-lab/v4.2.0/using-slm-lab/train-and-enjoy-dqn-cartpole","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-M4tVbdlLJwaEAB8YoPJ","title":"Resume and Enjoy: REINFORCE CartPole","pathname":"/slm-lab/v4.2.0/using-slm-lab/resume-and-enjoy-reinforce-cartpole","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LthqahlEeoIIsZ06zLV","title":"Agent Spec: DDQN+PER on LunarLander","pathname":"/slm-lab/v4.2.0/using-slm-lab/agent-spec-ddqn+per-on-lunarlander","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LthqlKBQyGp3Bi12-aU","title":"Env Spec: A2C on Pong","pathname":"/slm-lab/v4.2.0/using-slm-lab/environment-spec-a2c-on-bipedalwalker","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LthqnykF_9LpvLbntB1","title":"GPU Usage: PPO on Pong","pathname":"/slm-lab/v4.2.0/using-slm-lab/gpu-usage-ppo-on-pong","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LthrO3XSjIXpesSKLs8","title":"Parallelizing Training: Async SAC on Humanoid","pathname":"/slm-lab/v4.2.0/using-slm-lab/parallelizing-training-async-sac-on-humanoid","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lthz5HIxAIjWUM5WeSc","title":"Experiment and Search Spec: PPO on Breakout","pathname":"/slm-lab/v4.2.0/using-slm-lab/search-spec-ppo-on-breakout","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LtvuZi_3yhTG9PoFBBP","title":"Run Benchmark: A2C on Atari Games","pathname":"/slm-lab/v4.2.0/using-slm-lab/run-benchmark-a2c-on-atari-games","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Luy5RkIoK6qltM7Mzwz","title":"Meta Spec: High Level Specifications","pathname":"/slm-lab/v4.2.0/using-slm-lab/meta-spec-high-level-specifications","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lu0TBCyNbOoeqFW1W5E","title":"Post-Hoc Analysis","pathname":"/slm-lab/v4.2.0/using-slm-lab/post-hoc-analysis","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lu3jBvYUWQwVU9fvCIc","title":"TensorBoard: Visualizing Models and Actions","pathname":"/slm-lab/v4.2.0/using-slm-lab/tensorboard-visualizing-models-and-actions","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lti-lPTXdwpliw8hkXa","title":"Using SLM Lab In Your Project","pathname":"/slm-lab/v4.2.0/using-slm-lab/using-slm-lab-in-your-project","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LterM61KjikSY8FA_E7","title":"Data Locations","pathname":"/slm-lab/v4.2.0/analyzing-results/analytics","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"📈Analyzing Results"}]},{"id":"-LterM65ALqarawv7l3Q","title":"Graphs and Data","pathname":"/slm-lab/v4.2.0/analyzing-results/session-graph","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"📈Analyzing Results"}]},{"id":"-M-VdXUSZpJPb-tMSTDN","title":"Performance Metrics","pathname":"/slm-lab/v4.2.0/analyzing-results/performance-metrics","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"📈Analyzing Results"}]},{"id":"-Lu0bsgEkSvzG3x5Sa5z","title":"Public Benchmark Data","pathname":"/slm-lab/v4.2.0/benchmark-results/public-benchmark-data","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-Lti3U-T96_jSYz332kZ","title":"Discrete Environment Benchmark","pathname":"/slm-lab/v4.2.0/benchmark-results/discrete-benchmark","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-Lti3gXXj0E3FSY-F3PY","title":"Continuous Environment Benchmark","pathname":"/slm-lab/v4.2.0/benchmark-results/continuous-benchmark","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-Lti3lLfTXQJ-9FacY6u","title":"Atari Environment Benchmark","pathname":"/slm-lab/v4.2.0/benchmark-results/atari-benchmark","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-LuE4en9ToLToatNHXHV","title":"RL GIFs","pathname":"/slm-lab/v4.2.0/benchmark-results/rl-gifs","siteSpaceId":"sitesp_L00gt","description":"A collection of replay GIFs generated from SLM Lab agents in \"enjoy\" mode.","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-Lu0MnaZtslkKTeLfbEP","title":"Modular Design","pathname":"/slm-lab/v4.2.0/development/modular-lab-components","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-Lu8ngGlJ2ezSyAUwe3K","title":"Algorithm Taxonomy","pathname":"/slm-lab/v4.2.0/development/modular-lab-components/algorithm-taxonomy","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Modular Design"}]},{"id":"-Lu8nsnRc6B3qQXsQ-SH","title":"Class Inheritance: A2C > PPO","pathname":"/slm-lab/v4.2.0/development/modular-lab-components/class-inheritance-a2c-greater-than-ppo","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Modular Design"}]},{"id":"-LterM67Q0oedx9zf1aO","title":"Algorithm","pathname":"/slm-lab/v4.2.0/development/algorithms","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-LterM68QAuqU8BRS1IS","title":"DQN","pathname":"/slm-lab/v4.2.0/development/algorithms/dqn","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Algorithm"}]},{"id":"-LterM69lsUmITlcjdAg","title":"REINFORCE","pathname":"/slm-lab/v4.2.0/development/algorithms/reinforce","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Algorithm"}]},{"id":"-LterM6AsV56I_kYMC3V","title":"Actor Critic","pathname":"/slm-lab/v4.2.0/development/algorithms/a2c","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Algorithm"}]},{"id":"-LterM6FHmh1jISAyqNF","title":"Memory","pathname":"/slm-lab/v4.2.0/development/memory","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-LterM6G8YWJIY6wM7av","title":"Replay","pathname":"/slm-lab/v4.2.0/development/memory/replay","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Memory"}]},{"id":"-LuDvz92OMcOUlDFQo2A","title":"PrioritizedReplay","pathname":"/slm-lab/v4.2.0/development/memory/prioritizedreplay","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Memory"}]},{"id":"-LterM6HqCk-OKhtOnj-","title":"OnPolicyReplay","pathname":"/slm-lab/v4.2.0/development/memory/batch","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Memory"}]},{"id":"-LterM6I0vZSi7ELIHE8","title":"OnPolicyBatchReplay","pathname":"/slm-lab/v4.2.0/development/memory/episodic","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Memory"}]},{"id":"-LterM6BJgs8kuTKickL","title":"Net","pathname":"/slm-lab/v4.2.0/development/neural-networks","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-LterM6CcDfTA4AUTzyZ","title":"MLP","pathname":"/slm-lab/v4.2.0/development/neural-networks/mlp","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Net"}]},{"id":"-LterM6DNa6pe0Eg8ebG","title":"CNN","pathname":"/slm-lab/v4.2.0/development/neural-networks/cnn","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Net"}]},{"id":"-LterM6E9b4cP3nirtNx","title":"RNN","pathname":"/slm-lab/v4.2.0/development/neural-networks/rnn","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Net"}]},{"id":"-LtwOeTez_53joLfC5gq","title":"Profiling SLM Lab","pathname":"/slm-lab/v4.2.0/development/profiling-slm-lab","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-Lti2AOZ5QhK3EY4UM_q","title":"Book: Foundations of Deep Reinforcement Learning","pathname":"/slm-lab/v4.2.0/publications-and-talks/instruction-for-the-book-+-intro-to-rl-section","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"📖Publications and Talks"}]},{"id":"-Lu0REXSPoyG5dsFgvTt","title":"Talks and Presentations","pathname":"/slm-lab/v4.2.0/publications-and-talks/talks-given-with-slm-lab","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"📖Publications and Talks"}]},{"id":"-Ltjuk46SVjugXyZ2n8g","title":"Deep RL Resources","pathname":"/slm-lab/v4.2.0/resources/untitled","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"-Lu1f2XH9CsbzK4-kUq-","title":"Contributing","pathname":"/slm-lab/v4.2.0/resources/contributing","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"-LterM5mYO2PcMxZVqE5","title":"Motivation","pathname":"/slm-lab/v4.2.0/resources/motivation","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"-LthvH4DQzSve0YYn29K","title":"Help","pathname":"/slm-lab/v4.2.0/resources/help","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"-LterM5noiDZ8TVPXl6p","title":"Contact","pathname":"/slm-lab/v4.2.0/resources/contacts","siteSpaceId":"sitesp_L00gt","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"-LterKS9HS0n1lQWmjmR","title":"SLM Lab","pathname":"/slm-lab/master","siteSpaceId":"sitesp_ZWWN5","description":"Modular Deep Reinforcement Learning framework in PyTorch."},{"id":"-LtetdjtNeY6_S0sV9dF","title":"Installation","pathname":"/slm-lab/master/setup/installation","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🖥Setup"}]},{"id":"-LtevlBNdLmRiVu8Mu3G","title":"Quick Start","pathname":"/slm-lab/master/setup/quick-start","siteSpaceId":"sitesp_ZWWN5","description":"To test the installation.","breadcrumbs":[{"label":"🖥Setup"}]},{"id":"-LthpAeI_RGeAE6rGuZS","title":"Lab Command","pathname":"/slm-lab/master/using-slm-lab/slm-lab-command","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lu0GqNzEpmVBs5aqj46","title":"Lab Organization","pathname":"/slm-lab/master/using-slm-lab/lab-organization","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lu0dA__Nq1nB894SsWV","title":"Train and Enjoy: REINFORCE CartPole","pathname":"/slm-lab/master/using-slm-lab/train-and-enjoy-dqn-cartpole","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LthqahlEeoIIsZ06zLV","title":"Agent Spec: DDQN+PER on LunarLander","pathname":"/slm-lab/master/using-slm-lab/agent-spec-ddqn+per-on-lunarlander","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LthqlKBQyGp3Bi12-aU","title":"Env Spec: A2C on Pong","pathname":"/slm-lab/master/using-slm-lab/environment-spec-a2c-on-bipedalwalker","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LthqnykF_9LpvLbntB1","title":"GPU Usage: PPO on Pong","pathname":"/slm-lab/master/using-slm-lab/gpu-usage-ppo-on-pong","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LthrO3XSjIXpesSKLs8","title":"Parallelizing Training: Async SAC on Humanoid","pathname":"/slm-lab/master/using-slm-lab/parallelizing-training-async-sac-on-humanoid","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lthz5HIxAIjWUM5WeSc","title":"Experiment and Search Spec: PPO on Breakout","pathname":"/slm-lab/master/using-slm-lab/search-spec-ppo-on-breakout","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LtvuZi_3yhTG9PoFBBP","title":"Run Benchmark: A2C on Atari Games","pathname":"/slm-lab/master/using-slm-lab/run-benchmark-a2c-on-atari-games","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Luy5RkIoK6qltM7Mzwz","title":"Meta Spec: High Level Specifications","pathname":"/slm-lab/master/using-slm-lab/meta-spec-high-level-specifications","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lu0TBCyNbOoeqFW1W5E","title":"Post-Hoc Analysis","pathname":"/slm-lab/master/using-slm-lab/post-hoc-analysis","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lu3jBvYUWQwVU9fvCIc","title":"TensorBoard: Visualizing Models and Actions","pathname":"/slm-lab/master/using-slm-lab/tensorboard-visualizing-models-and-actions","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lti-lPTXdwpliw8hkXa","title":"Using SLM Lab In Your Project","pathname":"/slm-lab/master/using-slm-lab/using-slm-lab-in-your-project","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LterM61KjikSY8FA_E7","title":"Data Locations","pathname":"/slm-lab/master/analyzing-results/analytics","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"📈Analyzing Results"}]},{"id":"-LterM65ALqarawv7l3Q","title":"Graphs and Data","pathname":"/slm-lab/master/analyzing-results/session-graph","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"📈Analyzing Results"}]},{"id":"-M-VdXUSZpJPb-tMSTDN","title":"Performance Metrics","pathname":"/slm-lab/master/analyzing-results/performance-metrics","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"📈Analyzing Results"}]},{"id":"-Lu0bsgEkSvzG3x5Sa5z","title":"Public Benchmark Data","pathname":"/slm-lab/master/benchmark-results/public-benchmark-data","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-Lti3U-T96_jSYz332kZ","title":"Discrete Environment Benchmark","pathname":"/slm-lab/master/benchmark-results/discrete-benchmark","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-Lti3gXXj0E3FSY-F3PY","title":"Continuous Environment Benchmark","pathname":"/slm-lab/master/benchmark-results/continuous-benchmark","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-Lti3lLfTXQJ-9FacY6u","title":"Atari Environment Benchmark","pathname":"/slm-lab/master/benchmark-results/atari-benchmark","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-LuE4en9ToLToatNHXHV","title":"RL GIFs","pathname":"/slm-lab/master/benchmark-results/rl-gifs","siteSpaceId":"sitesp_ZWWN5","description":"A collection of replay GIFs generated from SLM Lab agents in \"enjoy\" mode.","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-Lu0MnaZtslkKTeLfbEP","title":"Modular Design","pathname":"/slm-lab/master/development/modular-lab-components","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-Lu8ngGlJ2ezSyAUwe3K","title":"Algorithm Taxonomy","pathname":"/slm-lab/master/development/modular-lab-components/algorithm-taxonomy","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Modular Design"}]},{"id":"-Lu8nsnRc6B3qQXsQ-SH","title":"Class Inheritance: A2C > PPO","pathname":"/slm-lab/master/development/modular-lab-components/class-inheritance-a2c-greater-than-ppo","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Modular Design"}]},{"id":"-LterM67Q0oedx9zf1aO","title":"Algorithm","pathname":"/slm-lab/master/development/algorithms","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-LterM68QAuqU8BRS1IS","title":"DQN","pathname":"/slm-lab/master/development/algorithms/dqn","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Algorithm"}]},{"id":"-LterM69lsUmITlcjdAg","title":"REINFORCE","pathname":"/slm-lab/master/development/algorithms/reinforce","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Algorithm"}]},{"id":"-LterM6AsV56I_kYMC3V","title":"Actor Critic","pathname":"/slm-lab/master/development/algorithms/a2c","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Algorithm"}]},{"id":"-LterM6FHmh1jISAyqNF","title":"Memory","pathname":"/slm-lab/master/development/memory","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-LterM6G8YWJIY6wM7av","title":"Replay","pathname":"/slm-lab/master/development/memory/replay","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Memory"}]},{"id":"-LuDvz92OMcOUlDFQo2A","title":"PrioritizedReplay","pathname":"/slm-lab/master/development/memory/prioritizedreplay","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Memory"}]},{"id":"-LterM6HqCk-OKhtOnj-","title":"OnPolicyReplay","pathname":"/slm-lab/master/development/memory/batch","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Memory"}]},{"id":"-LterM6I0vZSi7ELIHE8","title":"OnPolicyBatchReplay","pathname":"/slm-lab/master/development/memory/episodic","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Memory"}]},{"id":"-LterM6BJgs8kuTKickL","title":"Net","pathname":"/slm-lab/master/development/neural-networks","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-LterM6CcDfTA4AUTzyZ","title":"MLP","pathname":"/slm-lab/master/development/neural-networks/mlp","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Net"}]},{"id":"-LterM6DNa6pe0Eg8ebG","title":"CNN","pathname":"/slm-lab/master/development/neural-networks/cnn","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Net"}]},{"id":"-LterM6E9b4cP3nirtNx","title":"RNN","pathname":"/slm-lab/master/development/neural-networks/rnn","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Net"}]},{"id":"-LtwOeTez_53joLfC5gq","title":"Profiling SLM Lab","pathname":"/slm-lab/master/development/profiling-slm-lab","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-Lti2AOZ5QhK3EY4UM_q","title":"Book: Foundations of Deep Reinforcement Learning","pathname":"/slm-lab/master/publications-and-talks/instruction-for-the-book-+-intro-to-rl-section","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"📖Publications and Talks"}]},{"id":"-Lu0REXSPoyG5dsFgvTt","title":"Talks and Presentations","pathname":"/slm-lab/master/publications-and-talks/talks-given-with-slm-lab","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"📖Publications and Talks"}]},{"id":"-Ltjuk46SVjugXyZ2n8g","title":"Deep RL Resources","pathname":"/slm-lab/master/resources/untitled","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"-Lu1f2XH9CsbzK4-kUq-","title":"Contributing","pathname":"/slm-lab/master/resources/contributing","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"-LterM5mYO2PcMxZVqE5","title":"Motivation","pathname":"/slm-lab/master/resources/motivation","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"-LthvH4DQzSve0YYn29K","title":"Help","pathname":"/slm-lab/master/resources/help","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"-LterM5noiDZ8TVPXl6p","title":"Contact","pathname":"/slm-lab/master/resources/contacts","siteSpaceId":"sitesp_ZWWN5","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"-LterKS9HS0n1lQWmjmR","title":"SLM Lab","pathname":"/slm-lab/v4.2.3","siteSpaceId":"sitesp_RQQtq","description":"Modular Deep Reinforcement Learning framework in PyTorch."},{"id":"-LtetdjtNeY6_S0sV9dF","title":"Installation","pathname":"/slm-lab/v4.2.3/setup/installation","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🖥Setup"}]},{"id":"-LtevlBNdLmRiVu8Mu3G","title":"Quick Start","pathname":"/slm-lab/v4.2.3/setup/quick-start","siteSpaceId":"sitesp_RQQtq","description":"To test the installation.","breadcrumbs":[{"label":"🖥Setup"}]},{"id":"-LthpAeI_RGeAE6rGuZS","title":"Lab Command","pathname":"/slm-lab/v4.2.3/using-slm-lab/slm-lab-command","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lu0GqNzEpmVBs5aqj46","title":"Lab Organization","pathname":"/slm-lab/v4.2.3/using-slm-lab/lab-organization","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lu0dA__Nq1nB894SsWV","title":"Train: REINFORCE CartPole","pathname":"/slm-lab/v4.2.3/using-slm-lab/train-and-enjoy-dqn-cartpole","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-M4tVbdlLJwaEAB8YoPJ","title":"Resume and Enjoy: REINFORCE CartPole","pathname":"/slm-lab/v4.2.3/using-slm-lab/resume-and-enjoy-reinforce-cartpole","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LthqahlEeoIIsZ06zLV","title":"Agent Spec: DDQN+PER on LunarLander","pathname":"/slm-lab/v4.2.3/using-slm-lab/agent-spec-ddqn+per-on-lunarlander","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LthqlKBQyGp3Bi12-aU","title":"Env Spec: A2C on Pong","pathname":"/slm-lab/v4.2.3/using-slm-lab/environment-spec-a2c-on-bipedalwalker","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LthqnykF_9LpvLbntB1","title":"GPU Usage: PPO on Pong","pathname":"/slm-lab/v4.2.3/using-slm-lab/gpu-usage-ppo-on-pong","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LthrO3XSjIXpesSKLs8","title":"Parallelizing Training: Async SAC on Humanoid","pathname":"/slm-lab/v4.2.3/using-slm-lab/parallelizing-training-async-sac-on-humanoid","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lthz5HIxAIjWUM5WeSc","title":"Experiment and Search Spec: PPO on Breakout","pathname":"/slm-lab/v4.2.3/using-slm-lab/search-spec-ppo-on-breakout","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LtvuZi_3yhTG9PoFBBP","title":"Run Benchmark: A2C on Atari Games","pathname":"/slm-lab/v4.2.3/using-slm-lab/run-benchmark-a2c-on-atari-games","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Luy5RkIoK6qltM7Mzwz","title":"Meta Spec: High Level Specifications","pathname":"/slm-lab/v4.2.3/using-slm-lab/meta-spec-high-level-specifications","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lu0TBCyNbOoeqFW1W5E","title":"Post-Hoc Analysis","pathname":"/slm-lab/v4.2.3/using-slm-lab/post-hoc-analysis","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lu3jBvYUWQwVU9fvCIc","title":"TensorBoard: Visualizing Models and Actions","pathname":"/slm-lab/v4.2.3/using-slm-lab/tensorboard-visualizing-models-and-actions","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-Lti-lPTXdwpliw8hkXa","title":"Using SLM Lab In Your Project","pathname":"/slm-lab/v4.2.3/using-slm-lab/using-slm-lab-in-your-project","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🚀Using SLM Lab"}]},{"id":"-LterM61KjikSY8FA_E7","title":"Data Locations","pathname":"/slm-lab/v4.2.3/analyzing-results/analytics","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"📈Analyzing Results"}]},{"id":"-LterM65ALqarawv7l3Q","title":"Graphs and Data","pathname":"/slm-lab/v4.2.3/analyzing-results/session-graph","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"📈Analyzing Results"}]},{"id":"-M-VdXUSZpJPb-tMSTDN","title":"Performance Metrics","pathname":"/slm-lab/v4.2.3/analyzing-results/performance-metrics","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"📈Analyzing Results"}]},{"id":"-Lu0bsgEkSvzG3x5Sa5z","title":"Public Benchmark Data","pathname":"/slm-lab/v4.2.3/benchmark-results/public-benchmark-data","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-Lti3U-T96_jSYz332kZ","title":"Discrete Environment Benchmark","pathname":"/slm-lab/v4.2.3/benchmark-results/discrete-benchmark","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-Lti3gXXj0E3FSY-F3PY","title":"Continuous Environment Benchmark","pathname":"/slm-lab/v4.2.3/benchmark-results/continuous-benchmark","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-Lti3lLfTXQJ-9FacY6u","title":"Atari Environment Benchmark","pathname":"/slm-lab/v4.2.3/benchmark-results/atari-benchmark","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-LuE4en9ToLToatNHXHV","title":"RL GIFs","pathname":"/slm-lab/v4.2.3/benchmark-results/rl-gifs","siteSpaceId":"sitesp_RQQtq","description":"A collection of replay GIFs generated from SLM Lab agents in \"enjoy\" mode.","breadcrumbs":[{"label":"🥇Benchmark Results"}]},{"id":"-Lu0MnaZtslkKTeLfbEP","title":"Modular Design","pathname":"/slm-lab/v4.2.3/development/modular-lab-components","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-Lu8ngGlJ2ezSyAUwe3K","title":"Algorithm Taxonomy","pathname":"/slm-lab/v4.2.3/development/modular-lab-components/algorithm-taxonomy","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Modular Design"}]},{"id":"-Lu8nsnRc6B3qQXsQ-SH","title":"Class Inheritance: A2C > PPO","pathname":"/slm-lab/v4.2.3/development/modular-lab-components/class-inheritance-a2c-greater-than-ppo","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Modular Design"}]},{"id":"-LterM67Q0oedx9zf1aO","title":"Algorithm","pathname":"/slm-lab/v4.2.3/development/algorithms","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-LterM68QAuqU8BRS1IS","title":"DQN","pathname":"/slm-lab/v4.2.3/development/algorithms/dqn","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Algorithm"}]},{"id":"-LterM69lsUmITlcjdAg","title":"REINFORCE","pathname":"/slm-lab/v4.2.3/development/algorithms/reinforce","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Algorithm"}]},{"id":"-LterM6AsV56I_kYMC3V","title":"Actor Critic","pathname":"/slm-lab/v4.2.3/development/algorithms/a2c","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Algorithm"}]},{"id":"-LterM6FHmh1jISAyqNF","title":"Memory","pathname":"/slm-lab/v4.2.3/development/memory","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-LterM6G8YWJIY6wM7av","title":"Replay","pathname":"/slm-lab/v4.2.3/development/memory/replay","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Memory"}]},{"id":"-LuDvz92OMcOUlDFQo2A","title":"PrioritizedReplay","pathname":"/slm-lab/v4.2.3/development/memory/prioritizedreplay","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Memory"}]},{"id":"-LterM6HqCk-OKhtOnj-","title":"OnPolicyReplay","pathname":"/slm-lab/v4.2.3/development/memory/batch","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Memory"}]},{"id":"-LterM6I0vZSi7ELIHE8","title":"OnPolicyBatchReplay","pathname":"/slm-lab/v4.2.3/development/memory/episodic","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Memory"}]},{"id":"-LterM6BJgs8kuTKickL","title":"Net","pathname":"/slm-lab/v4.2.3/development/neural-networks","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-LterM6CcDfTA4AUTzyZ","title":"MLP","pathname":"/slm-lab/v4.2.3/development/neural-networks/mlp","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Net"}]},{"id":"-LterM6DNa6pe0Eg8ebG","title":"CNN","pathname":"/slm-lab/v4.2.3/development/neural-networks/cnn","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Net"}]},{"id":"-LterM6E9b4cP3nirtNx","title":"RNN","pathname":"/slm-lab/v4.2.3/development/neural-networks/rnn","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"},{"label":"Net"}]},{"id":"-LtwOeTez_53joLfC5gq","title":"Profiling SLM Lab","pathname":"/slm-lab/v4.2.3/development/profiling-slm-lab","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🔧Development"}]},{"id":"-Lti2AOZ5QhK3EY4UM_q","title":"Book: Foundations of Deep Reinforcement Learning","pathname":"/slm-lab/v4.2.3/publications-and-talks/instruction-for-the-book-+-intro-to-rl-section","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"📖Publications and Talks"}]},{"id":"-Lu0REXSPoyG5dsFgvTt","title":"Talks and Presentations","pathname":"/slm-lab/v4.2.3/publications-and-talks/talks-given-with-slm-lab","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"📖Publications and Talks"}]},{"id":"-Ltjuk46SVjugXyZ2n8g","title":"Deep RL Resources","pathname":"/slm-lab/v4.2.3/resources/untitled","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"-Lu1f2XH9CsbzK4-kUq-","title":"Contributing","pathname":"/slm-lab/v4.2.3/resources/contributing","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"-LterM5mYO2PcMxZVqE5","title":"Motivation","pathname":"/slm-lab/v4.2.3/resources/motivation","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"-LthvH4DQzSve0YYn29K","title":"Help","pathname":"/slm-lab/v4.2.3/resources/help","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"-LterM5noiDZ8TVPXl6p","title":"Contact","pathname":"/slm-lab/v4.2.3/resources/contacts","siteSpaceId":"sitesp_RQQtq","description":"","breadcrumbs":[{"label":"🤓Resources"}]},{"id":"S9L9DzVjVevDRH8OzUJR","title":"SLM Lab","pathname":"/slm-lab/v5.0.0","siteSpaceId":"sitesp_J00bs","description":"Modular Deep Reinforcement Learning framework in PyTorch."},{"id":"cexAjDVZTl0F53bT51yO","title":"Installation","pathname":"/slm-lab/v5.0.0/setup/installation","siteSpaceId":"sitesp_J00bs","emoji":"1f4e6","description":"","breadcrumbs":[{"label":"Setup","emoji":"1f5a5"}]},{"id":"5wVqjGKjJXbTD6kEjAkE","title":"Quick Start","pathname":"/slm-lab/v5.0.0/setup/quick-start","siteSpaceId":"sitesp_J00bs","emoji":"26a1","description":"Test your installation with a quick demo.","breadcrumbs":[{"label":"Setup","emoji":"1f5a5"}]},{"id":"WBTrRuD8uxP1idrVTGiF","title":"Train: PPO on CartPole","pathname":"/slm-lab/v5.0.0/using-slm-lab/train-ppo-cartpole","siteSpaceId":"sitesp_J00bs","emoji":"25b6","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"JmgCC7CgDtkAJpVFqaoO","title":"Resume and Replay","pathname":"/slm-lab/v5.0.0/using-slm-lab/resume-and-replay","siteSpaceId":"sitesp_J00bs","emoji":"1f504","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"47T5PIPk0jCFd1FYHRBt","title":"Core Concepts","pathname":"/slm-lab/v5.0.0/using-slm-lab/lab-organization","siteSpaceId":"sitesp_J00bs","emoji":"1f393","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"zaXBbWzB2BSkHDYroG0J","title":"Agent Spec","pathname":"/slm-lab/v5.0.0/using-slm-lab/agent-spec-ddqn+per-on-lunarlander","siteSpaceId":"sitesp_J00bs","emoji":"1f916","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"CaZeyiuhanc4ZmkkkezT","title":"Env Spec","pathname":"/slm-lab/v5.0.0/using-slm-lab/environment-spec-a2c-on-bipedalwalker","siteSpaceId":"sitesp_J00bs","emoji":"1f30d","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"u92CkYm7oZ7nhVaRZdAM","title":"Meta Spec","pathname":"/slm-lab/v5.0.0/using-slm-lab/meta-spec-high-level-specifications","siteSpaceId":"sitesp_J00bs","emoji":"2699","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"dqkeuolRG6TYBXCp28wV","title":"Search Spec","pathname":"/slm-lab/v5.0.0/using-slm-lab/search-spec-ppo-on-breakout","siteSpaceId":"sitesp_J00bs","emoji":"1f50d","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"A6SK3H0UrjVC5eolNewn","title":"GPU Training","pathname":"/slm-lab/v5.0.0/using-slm-lab/gpu-usage-ppo-on-pong","siteSpaceId":"sitesp_J00bs","emoji":"1f3ae","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"7OEMkHZwMQM0yemyN2hL","title":"Remote Training","pathname":"/slm-lab/v5.0.0/using-slm-lab/remote-training","siteSpaceId":"sitesp_J00bs","emoji":"2601","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"3fnls6E2rrIfYozYbIi5","title":"Async Training: Hogwild!","pathname":"/slm-lab/v5.0.0/using-slm-lab/async-training-a3c-hogwild","siteSpaceId":"sitesp_J00bs","emoji":"26a1","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"dmfN8Vw0BweHzE1gtdKs","title":"Running Benchmarks","pathname":"/slm-lab/v5.0.0/using-slm-lab/benchmark-specs","siteSpaceId":"sitesp_J00bs","emoji":"1f4cb","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"5WrerdraLuYUPJIRqtZ6","title":"CLI Reference","pathname":"/slm-lab/v5.0.0/using-slm-lab/slm-lab-command","siteSpaceId":"sitesp_J00bs","emoji":"1f4bb","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"jSjb2jsf7y2nVnnSjsl4","title":"Data Locations","pathname":"/slm-lab/v5.0.0/analyzing-results/analytics","siteSpaceId":"sitesp_J00bs","emoji":"1f4c1","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"Um0h28YSYgLhaJyUemau","title":"Graphs and Data","pathname":"/slm-lab/v5.0.0/analyzing-results/session-graph","siteSpaceId":"sitesp_J00bs","emoji":"1f4ca","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"LA3qCClsIPgnbZX6RpaQ","title":"TensorBoard","pathname":"/slm-lab/v5.0.0/analyzing-results/tensorboard-visualizing-models-and-actions","siteSpaceId":"sitesp_J00bs","emoji":"1f4c9","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"TKMnT3oMT21aP5qtzpmT","title":"Performance Metrics","pathname":"/slm-lab/v5.0.0/analyzing-results/performance-metrics","siteSpaceId":"sitesp_J00bs","emoji":"1f3af","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"GUPYoFg1I0BnsOdCX4QZ","title":"Post-Hoc Analysis","pathname":"/slm-lab/v5.0.0/analyzing-results/post-hoc-analysis","siteSpaceId":"sitesp_J00bs","emoji":"1f52c","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"4cUU3NEfxKv8FIFmBosQ","title":"Public Benchmark Data","pathname":"/slm-lab/v5.0.0/benchmark-results/public-benchmark-data","siteSpaceId":"sitesp_J00bs","emoji":"1f517","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"CD8k8pRWnWAlpPHbNbff","title":"Discrete Benchmark","pathname":"/slm-lab/v5.0.0/benchmark-results/discrete-benchmark","siteSpaceId":"sitesp_J00bs","emoji":"1f3af","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"3xK4QuUupCLmckIbJvn4","title":"Continuous Benchmark","pathname":"/slm-lab/v5.0.0/benchmark-results/continuous-benchmark","siteSpaceId":"sitesp_J00bs","emoji":"1f3c3","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"sAyToR6IsoZrbHEdzW1a","title":"Atari Benchmark","pathname":"/slm-lab/v5.0.0/benchmark-results/atari-benchmark","siteSpaceId":"sitesp_J00bs","emoji":"1f47e","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"NEpmlhJ3EnFqqhKUZ2ef","title":"RL GIFs","pathname":"/slm-lab/v5.0.0/benchmark-results/rl-gifs","siteSpaceId":"sitesp_J00bs","emoji":"1f3ac","description":"Trained agents in action—watch SLM Lab's PPO and SAC algorithms play games and control robots.","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"evsksG6VHELPlRD6ikvE","title":"Architecture","pathname":"/slm-lab/v5.0.0/development/architecture","siteSpaceId":"sitesp_J00bs","emoji":"1f3d7","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"yfghm0NtzKpFnZjZW4bJ","title":"Modular Design","pathname":"/slm-lab/v5.0.0/development/modular-lab-components","siteSpaceId":"sitesp_J00bs","emoji":"1f9e9","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"JtCyJq1FbbUfEvTAWzLF","title":"Algorithm Taxonomy","pathname":"/slm-lab/v5.0.0/development/modular-lab-components/algorithm-taxonomy","siteSpaceId":"sitesp_J00bs","emoji":"1f4da","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Modular Design","emoji":"1f9e9"}]},{"id":"3DCSQEUmJF4i3zuha6zJ","title":"Class Inheritance: A2C > PPO","pathname":"/slm-lab/v5.0.0/development/modular-lab-components/class-inheritance-a2c-greater-than-ppo","siteSpaceId":"sitesp_J00bs","emoji":"1f517","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Modular Design","emoji":"1f9e9"}]},{"id":"9znMVLdwRBIV5gfjYNgb","title":"Algorithm Families","pathname":"/slm-lab/v5.0.0/development/algorithms","siteSpaceId":"sitesp_J00bs","emoji":"1f9e0","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"HdhFNcQRds2PIjLxy7Vs","title":"DQN","pathname":"/slm-lab/v5.0.0/development/algorithms/dqn","siteSpaceId":"sitesp_J00bs","emoji":"1f48e","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"}]},{"id":"hssFCd6EDmGzbguqs4q0","title":"REINFORCE","pathname":"/slm-lab/v5.0.0/development/algorithms/reinforce","siteSpaceId":"sitesp_J00bs","emoji":"1f3b2","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"}]},{"id":"YIgCZZDQDCv9wpElWqCl","title":"Actor-Critic","pathname":"/slm-lab/v5.0.0/development/algorithms/a2c","siteSpaceId":"sitesp_J00bs","emoji":"1f3ad","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"}]},{"id":"PIcm3ts1de5NJpG6eniv","title":"Memory","pathname":"/slm-lab/v5.0.0/development/memory","siteSpaceId":"sitesp_J00bs","emoji":"1f4be","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"jplaG44MiQmw7Hb5KDmS","title":"Replay","pathname":"/slm-lab/v5.0.0/development/memory/replay","siteSpaceId":"sitesp_J00bs","emoji":"1f504","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"CN5FRuBn7So8Se63cab7","title":"PrioritizedReplay","pathname":"/slm-lab/v5.0.0/development/memory/prioritizedreplay","siteSpaceId":"sitesp_J00bs","emoji":"2b50","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"hBcXqn07YEG82KiUQZHq","title":"OnPolicyReplay","pathname":"/slm-lab/v5.0.0/development/memory/onpolicyreplay","siteSpaceId":"sitesp_J00bs","emoji":"1f4e4","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"WWMdvMPnT8pDh2apqdP2","title":"OnPolicyBatchReplay","pathname":"/slm-lab/v5.0.0/development/memory/onpolicybatchreplay","siteSpaceId":"sitesp_J00bs","emoji":"1f4e6","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"eGE4a6sZ5IVbwHJT4wed","title":"Net","pathname":"/slm-lab/v5.0.0/development/neural-networks","siteSpaceId":"sitesp_J00bs","emoji":"1f9ec","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"ZWvvCHWfMXbboV635U3V","title":"MLP","pathname":"/slm-lab/v5.0.0/development/neural-networks/mlp","siteSpaceId":"sitesp_J00bs","emoji":"1f522","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"z9rP5ohFoHMpVToF16TR","title":"CNN","pathname":"/slm-lab/v5.0.0/development/neural-networks/cnn","siteSpaceId":"sitesp_J00bs","emoji":"1f5bc","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"za7nBA4SPgAz6i4QuQ6M","title":"RNN","pathname":"/slm-lab/v5.0.0/development/neural-networks/rnn","siteSpaceId":"sitesp_J00bs","emoji":"1f501","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"YsvpJ9zLyacAl5zlbCAQ","title":"Profiling SLM Lab","pathname":"/slm-lab/v5.0.0/development/profiling-slm-lab","siteSpaceId":"sitesp_J00bs","emoji":"23f1","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"B69YmTAxYUsqaTf3FjUe","title":"Using SLM Lab In Your Project","pathname":"/slm-lab/v5.0.0/development/using-slm-lab-in-your-project","siteSpaceId":"sitesp_J00bs","emoji":"1f50c","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"1SvUsTfLloiHzCnONtFt","title":"Book: Foundations of Deep RL","pathname":"/slm-lab/v5.0.0/publications-and-talks/instruction-for-the-book-+-intro-to-rl-section","siteSpaceId":"sitesp_J00bs","emoji":"1f4d5","description":"","breadcrumbs":[{"label":"Publications and Talks","emoji":"1f4d6"}]},{"id":"MFSk7LVlfRP6xHa7V9WE","title":"Talks and Presentations","pathname":"/slm-lab/v5.0.0/publications-and-talks/talks-given-with-slm-lab","siteSpaceId":"sitesp_J00bs","emoji":"1f3a4","description":"","breadcrumbs":[{"label":"Publications and Talks","emoji":"1f4d6"}]},{"id":"kdCL36wFXgbDZGQFSqUb","title":"Deep RL Resources","pathname":"/slm-lab/v5.0.0/resources/untitled","siteSpaceId":"sitesp_J00bs","emoji":"1f4da","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"XvewkHtmblGj5g1Mtx9N","title":"Contributing","pathname":"/slm-lab/v5.0.0/resources/contributing","siteSpaceId":"sitesp_J00bs","emoji":"1f91d","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"yfxoNXNiQXWIwmpmLdlV","title":"Code of Conduct","pathname":"/slm-lab/v5.0.0/resources/code-of-conduct","siteSpaceId":"sitesp_J00bs","emoji":"1f4dc","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"JYwD5IViUhYpVofvPAjV","title":"Motivation","pathname":"/slm-lab/v5.0.0/resources/motivation","siteSpaceId":"sitesp_J00bs","emoji":"1f4a1","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"uFkQAPDkJrn45Zbl5WP8","title":"Help","pathname":"/slm-lab/v5.0.0/resources/help","siteSpaceId":"sitesp_J00bs","emoji":"2753","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"36uZa2IEfasXVXA9oWBE","title":"Contact","pathname":"/slm-lab/v5.0.0/resources/contacts","siteSpaceId":"sitesp_J00bs","emoji":"1f4e7","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"Khvk1FnPuNCDY9ZCiKA1","title":"Changelog","pathname":"/slm-lab/v5.0.0/resources/changelog","siteSpaceId":"sitesp_J00bs","emoji":"1f4dd","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"Sm0LBojOM6YYQ5xjsvHt","title":"SLM Lab","pathname":"/slm-lab/v5.1.0","siteSpaceId":"sitesp_Rfp79","description":"Modular Deep Reinforcement Learning framework in PyTorch."},{"id":"YFjTDk0cPunGDf1MvppC","title":"Installation","pathname":"/slm-lab/v5.1.0/setup/installation","siteSpaceId":"sitesp_Rfp79","emoji":"1f4e6","description":"","breadcrumbs":[{"label":"Setup","emoji":"1f5a5"}]},{"id":"y8FMgEQffw481aPwvPna","title":"Quick Start","pathname":"/slm-lab/v5.1.0/setup/quick-start","siteSpaceId":"sitesp_Rfp79","emoji":"26a1","description":"Test your installation with a quick demo.","breadcrumbs":[{"label":"Setup","emoji":"1f5a5"}]},{"id":"BmaIOeJsUjWPjFmRWzN4","title":"Train: PPO on CartPole","pathname":"/slm-lab/v5.1.0/using-slm-lab/train-ppo-cartpole","siteSpaceId":"sitesp_Rfp79","emoji":"25b6","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"uyI1vJCBvZWWuhahloVh","title":"Resume and Replay","pathname":"/slm-lab/v5.1.0/using-slm-lab/resume-and-replay","siteSpaceId":"sitesp_Rfp79","emoji":"1f504","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"5uhK9fz6R3wsz7qUJX83","title":"Core Concepts","pathname":"/slm-lab/v5.1.0/using-slm-lab/lab-organization","siteSpaceId":"sitesp_Rfp79","emoji":"1f393","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"1ylutVS5fqA1qvl0Kz9c","title":"Agent Spec","pathname":"/slm-lab/v5.1.0/using-slm-lab/agent-spec-ddqn+per-on-lunarlander","siteSpaceId":"sitesp_Rfp79","emoji":"1f916","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"nT7KH9FEow4lhyUNls4N","title":"Env Spec","pathname":"/slm-lab/v5.1.0/using-slm-lab/environment-spec-a2c-on-bipedalwalker","siteSpaceId":"sitesp_Rfp79","emoji":"1f30d","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"FC8PSbnvkhxMY6ErjtsT","title":"Meta Spec","pathname":"/slm-lab/v5.1.0/using-slm-lab/meta-spec-high-level-specifications","siteSpaceId":"sitesp_Rfp79","emoji":"2699","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"k1seizwTDZoFS3N527UR","title":"Search Spec","pathname":"/slm-lab/v5.1.0/using-slm-lab/search-spec-ppo-on-breakout","siteSpaceId":"sitesp_Rfp79","emoji":"1f50d","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"Tqstt5957xLUlCWguHCf","title":"GPU Training","pathname":"/slm-lab/v5.1.0/using-slm-lab/gpu-usage-ppo-on-pong","siteSpaceId":"sitesp_Rfp79","emoji":"1f3ae","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"gSfjM28RIzphYM7Mhr9C","title":"Remote Training","pathname":"/slm-lab/v5.1.0/using-slm-lab/remote-training","siteSpaceId":"sitesp_Rfp79","emoji":"2601","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"4HjV9BLCxL9x9I7GGh7n","title":"Async Training: Hogwild!","pathname":"/slm-lab/v5.1.0/using-slm-lab/async-training-a3c-hogwild","siteSpaceId":"sitesp_Rfp79","emoji":"26a1","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"FMRIPjAMFX2eYx8sDJ8O","title":"Running Benchmarks","pathname":"/slm-lab/v5.1.0/using-slm-lab/benchmark-specs","siteSpaceId":"sitesp_Rfp79","emoji":"1f4cb","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"xz1D2Ehvw8UOAbh7adha","title":"CLI Reference","pathname":"/slm-lab/v5.1.0/using-slm-lab/slm-lab-command","siteSpaceId":"sitesp_Rfp79","emoji":"1f4bb","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"ZtSupF33ETAECl5hlaFd","title":"Data Locations","pathname":"/slm-lab/v5.1.0/analyzing-results/analytics","siteSpaceId":"sitesp_Rfp79","emoji":"1f4c1","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"DfJAq7xxbGvkB78b7gYy","title":"Graphs and Data","pathname":"/slm-lab/v5.1.0/analyzing-results/session-graph","siteSpaceId":"sitesp_Rfp79","emoji":"1f4ca","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"JPkH7R7IKlLGC6xQLdK4","title":"TensorBoard","pathname":"/slm-lab/v5.1.0/analyzing-results/tensorboard-visualizing-models-and-actions","siteSpaceId":"sitesp_Rfp79","emoji":"1f4c9","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"HLjyjcDWWPGsPoD5UoOG","title":"Performance Metrics","pathname":"/slm-lab/v5.1.0/analyzing-results/performance-metrics","siteSpaceId":"sitesp_Rfp79","emoji":"1f3af","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"AC0jnjKqrzLAeqTGi8F5","title":"Post-Hoc Analysis","pathname":"/slm-lab/v5.1.0/analyzing-results/post-hoc-analysis","siteSpaceId":"sitesp_Rfp79","emoji":"1f52c","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"OPWKSqYF9gxaV4ePtlwF","title":"Public Benchmark Data","pathname":"/slm-lab/v5.1.0/benchmark-results/public-benchmark-data","siteSpaceId":"sitesp_Rfp79","emoji":"1f517","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"ud7Uvn55xL4SE80mIh84","title":"Discrete Benchmark","pathname":"/slm-lab/v5.1.0/benchmark-results/discrete-benchmark","siteSpaceId":"sitesp_Rfp79","emoji":"1f3af","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"bkROfPyoiplQC1yBbugf","title":"Continuous Benchmark","pathname":"/slm-lab/v5.1.0/benchmark-results/continuous-benchmark","siteSpaceId":"sitesp_Rfp79","emoji":"1f3c3","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"8KwFn8Mgctg3KmrcP1ed","title":"Atari Benchmark","pathname":"/slm-lab/v5.1.0/benchmark-results/atari-benchmark","siteSpaceId":"sitesp_Rfp79","emoji":"1f47e","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"Le9BFZkaxkwCZhXC8GVi","title":"RL GIFs","pathname":"/slm-lab/v5.1.0/benchmark-results/rl-gifs","siteSpaceId":"sitesp_Rfp79","emoji":"1f3ac","description":"Trained agents in action—watch SLM Lab's PPO and SAC algorithms play games and control robots.","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"zCyL8HCYlCclNIwpnfpg","title":"Architecture","pathname":"/slm-lab/v5.1.0/development/architecture","siteSpaceId":"sitesp_Rfp79","emoji":"1f3d7","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"gETmOTHTCrIL260307EG","title":"Modular Design","pathname":"/slm-lab/v5.1.0/development/modular-lab-components","siteSpaceId":"sitesp_Rfp79","emoji":"1f9e9","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"ZkXovFgk1MvBHH5d0gfW","title":"Algorithm Taxonomy","pathname":"/slm-lab/v5.1.0/development/modular-lab-components/algorithm-taxonomy","siteSpaceId":"sitesp_Rfp79","emoji":"1f4da","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Modular Design","emoji":"1f9e9"}]},{"id":"URKWbsITxcXVKbQUpX9N","title":"Class Inheritance: A2C > PPO","pathname":"/slm-lab/v5.1.0/development/modular-lab-components/class-inheritance-a2c-greater-than-ppo","siteSpaceId":"sitesp_Rfp79","emoji":"1f517","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Modular Design","emoji":"1f9e9"}]},{"id":"Uc5nauoBe1FfKHvcpSFE","title":"Algorithm Families","pathname":"/slm-lab/v5.1.0/development/algorithms","siteSpaceId":"sitesp_Rfp79","emoji":"1f9e0","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"JcoC6PPLXEDJclogXAHi","title":"DQN","pathname":"/slm-lab/v5.1.0/development/algorithms/dqn","siteSpaceId":"sitesp_Rfp79","emoji":"1f48e","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"}]},{"id":"hMWXVXSWZLMamAuv2WSI","title":"REINFORCE","pathname":"/slm-lab/v5.1.0/development/algorithms/reinforce","siteSpaceId":"sitesp_Rfp79","emoji":"1f3b2","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"}]},{"id":"XwXjNh6jGCrTh0EHFtGf","title":"Actor-Critic","pathname":"/slm-lab/v5.1.0/development/algorithms/a2c","siteSpaceId":"sitesp_Rfp79","emoji":"1f3ad","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"}]},{"id":"4RVUWZJi2F3ZkU4klIPz","title":"Memory","pathname":"/slm-lab/v5.1.0/development/memory","siteSpaceId":"sitesp_Rfp79","emoji":"1f4be","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"en10Uw2PPbKSG58P748y","title":"Replay","pathname":"/slm-lab/v5.1.0/development/memory/replay","siteSpaceId":"sitesp_Rfp79","emoji":"1f504","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"Qxn29g9lcrHtAGLTF3oF","title":"PrioritizedReplay","pathname":"/slm-lab/v5.1.0/development/memory/prioritizedreplay","siteSpaceId":"sitesp_Rfp79","emoji":"2b50","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"34lT6mmcXOeCqAsJmSGX","title":"OnPolicyReplay","pathname":"/slm-lab/v5.1.0/development/memory/onpolicyreplay","siteSpaceId":"sitesp_Rfp79","emoji":"1f4e4","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"Xt2tdRa8xxxLKNiMUGm4","title":"OnPolicyBatchReplay","pathname":"/slm-lab/v5.1.0/development/memory/onpolicybatchreplay","siteSpaceId":"sitesp_Rfp79","emoji":"1f4e6","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"i5FsJVoKQsmqdUTx3byx","title":"Net","pathname":"/slm-lab/v5.1.0/development/neural-networks","siteSpaceId":"sitesp_Rfp79","emoji":"1f9ec","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"Vz63a3NSw4R4fZkk2xkV","title":"MLP","pathname":"/slm-lab/v5.1.0/development/neural-networks/mlp","siteSpaceId":"sitesp_Rfp79","emoji":"1f522","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"gU1ANJtqy3OQtR2iyzf1","title":"CNN","pathname":"/slm-lab/v5.1.0/development/neural-networks/cnn","siteSpaceId":"sitesp_Rfp79","emoji":"1f5bc","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"bRfSO3BkCJxkveoBsSNc","title":"RNN","pathname":"/slm-lab/v5.1.0/development/neural-networks/rnn","siteSpaceId":"sitesp_Rfp79","emoji":"1f501","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"6dUnwNmktYkktAVR5SXP","title":"TorchArc","pathname":"/slm-lab/v5.1.0/development/neural-networks/torcharc","siteSpaceId":"sitesp_Rfp79","emoji":"1f4d0","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"jcCAE8W3VlZ9WwQcKPp8","title":"Profiling SLM Lab","pathname":"/slm-lab/v5.1.0/development/profiling-slm-lab","siteSpaceId":"sitesp_Rfp79","emoji":"23f1","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"81TBpsskBblYFwkWzyGs","title":"Using SLM Lab In Your Project","pathname":"/slm-lab/v5.1.0/development/using-slm-lab-in-your-project","siteSpaceId":"sitesp_Rfp79","emoji":"1f50c","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"kqu3GuqRSmY6WE0vcZDO","title":"Book: Foundations of Deep RL","pathname":"/slm-lab/v5.1.0/publications-and-talks/instruction-for-the-book-+-intro-to-rl-section","siteSpaceId":"sitesp_Rfp79","emoji":"1f4d5","description":"","breadcrumbs":[{"label":"Publications and Talks","emoji":"1f4d6"}]},{"id":"XBpuX6iWPpitDyzBbDxO","title":"Talks and Presentations","pathname":"/slm-lab/v5.1.0/publications-and-talks/talks-given-with-slm-lab","siteSpaceId":"sitesp_Rfp79","emoji":"1f3a4","description":"","breadcrumbs":[{"label":"Publications and Talks","emoji":"1f4d6"}]},{"id":"00w7y1Oe90ihIrsGWHIC","title":"Deep RL Resources","pathname":"/slm-lab/v5.1.0/resources/untitled","siteSpaceId":"sitesp_Rfp79","emoji":"1f4da","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"Zn4ngF8mCm6AtWTQsg4D","title":"Contributing","pathname":"/slm-lab/v5.1.0/resources/contributing","siteSpaceId":"sitesp_Rfp79","emoji":"1f91d","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"0EG4wu8V2NZvyj6D3hu8","title":"Code of Conduct","pathname":"/slm-lab/v5.1.0/resources/code-of-conduct","siteSpaceId":"sitesp_Rfp79","emoji":"1f4dc","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"kShWoKu4nM6GVn3chFXq","title":"Motivation","pathname":"/slm-lab/v5.1.0/resources/motivation","siteSpaceId":"sitesp_Rfp79","emoji":"1f4a1","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"4erhzVbsqe2QxngIfnBC","title":"Help","pathname":"/slm-lab/v5.1.0/resources/help","siteSpaceId":"sitesp_Rfp79","emoji":"2753","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"ej0N4iHSK8aXDY7IqTqI","title":"Contact","pathname":"/slm-lab/v5.1.0/resources/contacts","siteSpaceId":"sitesp_Rfp79","emoji":"1f4e7","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"yPj2b9ROusXmhAHcCWAf","title":"Changelog","pathname":"/slm-lab/v5.1.0/resources/changelog","siteSpaceId":"sitesp_Rfp79","emoji":"1f4dd","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"06xygHakPCtEMnTt8FGx","title":"SLM Lab","pathname":"/slm-lab/v5.2.0","siteSpaceId":"sitesp_5uxC0","description":"Modular Deep Reinforcement Learning framework in PyTorch."},{"id":"LU2bsCFfxLxYWr3P5MaE","title":"Installation","pathname":"/slm-lab/v5.2.0/setup/installation","siteSpaceId":"sitesp_5uxC0","emoji":"1f4e6","description":"","breadcrumbs":[{"label":"Setup","emoji":"1f5a5"}]},{"id":"BRXWxqdL31EO5Nqw8Y3m","title":"Quick Start","pathname":"/slm-lab/v5.2.0/setup/quick-start","siteSpaceId":"sitesp_5uxC0","emoji":"26a1","description":"Test your installation with a quick demo.","breadcrumbs":[{"label":"Setup","emoji":"1f5a5"}]},{"id":"cz8wBCmBLL4yLa4TR9QL","title":"Train: PPO on CartPole","pathname":"/slm-lab/v5.2.0/using-slm-lab/train-ppo-cartpole","siteSpaceId":"sitesp_5uxC0","emoji":"25b6","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"92YqoN31Pr9oRSi3475q","title":"Resume and Replay","pathname":"/slm-lab/v5.2.0/using-slm-lab/resume-and-replay","siteSpaceId":"sitesp_5uxC0","emoji":"1f504","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"QPImg7XN2qLDPw140Gug","title":"Core Concepts","pathname":"/slm-lab/v5.2.0/using-slm-lab/lab-organization","siteSpaceId":"sitesp_5uxC0","emoji":"1f393","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"OhztzrdpmHkKvptelXZ2","title":"Agent Spec","pathname":"/slm-lab/v5.2.0/using-slm-lab/agent-spec-ddqn+per-on-lunarlander","siteSpaceId":"sitesp_5uxC0","emoji":"1f916","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"OECHt3OaqAKQCwEGEdgc","title":"Env Spec","pathname":"/slm-lab/v5.2.0/using-slm-lab/environment-spec-a2c-on-bipedalwalker","siteSpaceId":"sitesp_5uxC0","emoji":"1f30d","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"K3OHGTZjoQk9Y7K2jL6h","title":"Meta Spec","pathname":"/slm-lab/v5.2.0/using-slm-lab/meta-spec-high-level-specifications","siteSpaceId":"sitesp_5uxC0","emoji":"2699","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"cw9ta4JSZJCfG4naQtJo","title":"Search Spec","pathname":"/slm-lab/v5.2.0/using-slm-lab/search-spec-ppo-on-breakout","siteSpaceId":"sitesp_5uxC0","emoji":"1f50d","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"XqXweaZk8hjgFlYfLYpi","title":"GPU Training","pathname":"/slm-lab/v5.2.0/using-slm-lab/gpu-usage-ppo-on-pong","siteSpaceId":"sitesp_5uxC0","emoji":"1f3ae","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"qbNPiYrH7xIqj5Vp4EiX","title":"Remote Training","pathname":"/slm-lab/v5.2.0/using-slm-lab/remote-training","siteSpaceId":"sitesp_5uxC0","emoji":"2601","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"FRyYnXuwfDZVRZ4y0HrF","title":"Async Training: Hogwild!","pathname":"/slm-lab/v5.2.0/using-slm-lab/async-training-a3c-hogwild","siteSpaceId":"sitesp_5uxC0","emoji":"26a1","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"9xwYQRwcFiN9DjbxeQB0","title":"Running Benchmarks","pathname":"/slm-lab/v5.2.0/using-slm-lab/benchmark-specs","siteSpaceId":"sitesp_5uxC0","emoji":"1f4cb","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"4A17OsrF0GGSJAztkEmJ","title":"CLI Reference","pathname":"/slm-lab/v5.2.0/using-slm-lab/slm-lab-command","siteSpaceId":"sitesp_5uxC0","emoji":"1f4bb","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"OsvkRyl9vATX3dX8OhTr","title":"Data Locations","pathname":"/slm-lab/v5.2.0/analyzing-results/analytics","siteSpaceId":"sitesp_5uxC0","emoji":"1f4c1","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"Ex5XSQHOWY5wdtrj6yxd","title":"Graphs and Data","pathname":"/slm-lab/v5.2.0/analyzing-results/session-graph","siteSpaceId":"sitesp_5uxC0","emoji":"1f4ca","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"MtmtGgjjue8qSpuIph9H","title":"TensorBoard","pathname":"/slm-lab/v5.2.0/analyzing-results/tensorboard-visualizing-models-and-actions","siteSpaceId":"sitesp_5uxC0","emoji":"1f4c9","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"qNwQnb0cc9SxQBF3Zjjk","title":"Performance Metrics","pathname":"/slm-lab/v5.2.0/analyzing-results/performance-metrics","siteSpaceId":"sitesp_5uxC0","emoji":"1f3af","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"MBcNTddZ6l82al4kIWnv","title":"Post-Hoc Analysis","pathname":"/slm-lab/v5.2.0/analyzing-results/post-hoc-analysis","siteSpaceId":"sitesp_5uxC0","emoji":"1f52c","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"3ZIWR6WSvaxchNqnNQsK","title":"Public Benchmark Data","pathname":"/slm-lab/v5.2.0/benchmark-results/public-benchmark-data","siteSpaceId":"sitesp_5uxC0","emoji":"1f517","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"ChsXXta19xJqZAMPg5jE","title":"Discrete Benchmark","pathname":"/slm-lab/v5.2.0/benchmark-results/discrete-benchmark","siteSpaceId":"sitesp_5uxC0","emoji":"1f3af","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"9OdU1zMW6yKmoXeRQJ7F","title":"Continuous Benchmark","pathname":"/slm-lab/v5.2.0/benchmark-results/continuous-benchmark","siteSpaceId":"sitesp_5uxC0","emoji":"1f3c3","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"d8TOPj1Tvp6WEv4FESJc","title":"Atari Benchmark","pathname":"/slm-lab/v5.2.0/benchmark-results/atari-benchmark","siteSpaceId":"sitesp_5uxC0","emoji":"1f47e","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"0Ub77sllSoGdSTPrki1h","title":"RL GIFs","pathname":"/slm-lab/v5.2.0/benchmark-results/rl-gifs","siteSpaceId":"sitesp_5uxC0","emoji":"1f3ac","description":"Trained agents in action—watch SLM Lab's PPO and SAC algorithms play games and control robots.","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"vCJuJoyzixqlMnS1AsqJ","title":"Architecture","pathname":"/slm-lab/v5.2.0/development/architecture","siteSpaceId":"sitesp_5uxC0","emoji":"1f3d7","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"oVVwq77H258BKiZJxdst","title":"Modular Design","pathname":"/slm-lab/v5.2.0/development/modular-lab-components","siteSpaceId":"sitesp_5uxC0","emoji":"1f9e9","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"9kGFPCfJA4eNdSBTCohZ","title":"Algorithm Taxonomy","pathname":"/slm-lab/v5.2.0/development/modular-lab-components/algorithm-taxonomy","siteSpaceId":"sitesp_5uxC0","emoji":"1f4da","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Modular Design","emoji":"1f9e9"}]},{"id":"yGgXxPwwLFMObGNKCkaz","title":"Class Inheritance: A2C > PPO","pathname":"/slm-lab/v5.2.0/development/modular-lab-components/class-inheritance-a2c-greater-than-ppo","siteSpaceId":"sitesp_5uxC0","emoji":"1f517","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Modular Design","emoji":"1f9e9"}]},{"id":"Y1W76bkuJeWcyiqyDfBB","title":"Algorithm Families","pathname":"/slm-lab/v5.2.0/development/algorithms","siteSpaceId":"sitesp_5uxC0","emoji":"1f9e0","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"QjrXSO4BMpocXrnIpgEU","title":"DQN","pathname":"/slm-lab/v5.2.0/development/algorithms/dqn","siteSpaceId":"sitesp_5uxC0","emoji":"1f48e","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"}]},{"id":"6BYUfwC4O0sWiq9ZAdJt","title":"REINFORCE","pathname":"/slm-lab/v5.2.0/development/algorithms/reinforce","siteSpaceId":"sitesp_5uxC0","emoji":"1f3b2","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"}]},{"id":"2KvhoBQJJQZCcfnLw1xy","title":"Actor-Critic","pathname":"/slm-lab/v5.2.0/development/algorithms/a2c","siteSpaceId":"sitesp_5uxC0","emoji":"1f3ad","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"}]},{"id":"SBsrzxzu8uzp4sDiduJ1","title":"PPO","pathname":"/slm-lab/v5.2.0/development/algorithms/a2c/ppo","siteSpaceId":"sitesp_5uxC0","emoji":"1f535","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"},{"label":"Actor-Critic","emoji":"1f3ad"}]},{"id":"hR8FUgtrgnKYKEEGb5D5","title":"SAC","pathname":"/slm-lab/v5.2.0/development/algorithms/a2c/sac","siteSpaceId":"sitesp_5uxC0","emoji":"1f525","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"},{"label":"Actor-Critic","emoji":"1f3ad"}]},{"id":"Dx8XBHWPW0O8wF2xaaxz","title":"CrossQ","pathname":"/slm-lab/v5.2.0/development/algorithms/a2c/crossq","siteSpaceId":"sitesp_5uxC0","emoji":"26a1","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"},{"label":"Actor-Critic","emoji":"1f3ad"}]},{"id":"Mz9FRxflS0FOw6X9DqyM","title":"Memory","pathname":"/slm-lab/v5.2.0/development/memory","siteSpaceId":"sitesp_5uxC0","emoji":"1f4be","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"eXvtdcK1b9jYbtUtACyy","title":"Replay","pathname":"/slm-lab/v5.2.0/development/memory/replay","siteSpaceId":"sitesp_5uxC0","emoji":"1f504","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"PC3ZhepOJu7AZvgdEyYk","title":"PrioritizedReplay","pathname":"/slm-lab/v5.2.0/development/memory/prioritizedreplay","siteSpaceId":"sitesp_5uxC0","emoji":"2b50","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"2gAw4P1JjbHPna7Dtq7h","title":"OnPolicyReplay","pathname":"/slm-lab/v5.2.0/development/memory/onpolicyreplay","siteSpaceId":"sitesp_5uxC0","emoji":"1f4e4","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"4DedGQDC6jSq6MxUEuFo","title":"OnPolicyBatchReplay","pathname":"/slm-lab/v5.2.0/development/memory/onpolicybatchreplay","siteSpaceId":"sitesp_5uxC0","emoji":"1f4e6","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"6ghpts3OZbKboZK8px0r","title":"Net","pathname":"/slm-lab/v5.2.0/development/neural-networks","siteSpaceId":"sitesp_5uxC0","emoji":"1f9ec","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"EG6C7hgyPAbHeg89ktq1","title":"MLP","pathname":"/slm-lab/v5.2.0/development/neural-networks/mlp","siteSpaceId":"sitesp_5uxC0","emoji":"1f522","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"KMLJeEgq17MsFISnIJXW","title":"CNN","pathname":"/slm-lab/v5.2.0/development/neural-networks/cnn","siteSpaceId":"sitesp_5uxC0","emoji":"1f5bc","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"evOjHYHdO07eKgV9sOs3","title":"RNN","pathname":"/slm-lab/v5.2.0/development/neural-networks/rnn","siteSpaceId":"sitesp_5uxC0","emoji":"1f501","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"cd8JF2RKMKw9xaYwQAbC","title":"TorchArc","pathname":"/slm-lab/v5.2.0/development/neural-networks/torcharc","siteSpaceId":"sitesp_5uxC0","emoji":"1f4d0","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"4tmAHGQzsze52Enbvb0D","title":"Profiling SLM Lab","pathname":"/slm-lab/v5.2.0/development/profiling-slm-lab","siteSpaceId":"sitesp_5uxC0","emoji":"23f1","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"X1jAAd4IC3KMBhcsC6sv","title":"Using SLM Lab In Your Project","pathname":"/slm-lab/v5.2.0/development/using-slm-lab-in-your-project","siteSpaceId":"sitesp_5uxC0","emoji":"1f50c","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"YY395xjZ2AjbVneEPdL0","title":"Book: Foundations of Deep RL","pathname":"/slm-lab/v5.2.0/publications-and-talks/instruction-for-the-book-+-intro-to-rl-section","siteSpaceId":"sitesp_5uxC0","emoji":"1f4d5","description":"","breadcrumbs":[{"label":"Publications and Talks","emoji":"1f4d6"}]},{"id":"QLBm2zVQSMojNbHhwR8q","title":"Talks and Presentations","pathname":"/slm-lab/v5.2.0/publications-and-talks/talks-given-with-slm-lab","siteSpaceId":"sitesp_5uxC0","emoji":"1f3a4","description":"","breadcrumbs":[{"label":"Publications and Talks","emoji":"1f4d6"}]},{"id":"xOIdBLpoOYUqEYOfbOFy","title":"Deep RL Resources","pathname":"/slm-lab/v5.2.0/resources/untitled","siteSpaceId":"sitesp_5uxC0","emoji":"1f4da","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"FEZnHlj8baDJMd4GqLD3","title":"Contributing","pathname":"/slm-lab/v5.2.0/resources/contributing","siteSpaceId":"sitesp_5uxC0","emoji":"1f91d","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"hGBMBM8dWvkXJKuR7Rib","title":"Code of Conduct","pathname":"/slm-lab/v5.2.0/resources/code-of-conduct","siteSpaceId":"sitesp_5uxC0","emoji":"1f4dc","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"YzR9JtaQo6haqgGuoNTM","title":"Motivation","pathname":"/slm-lab/v5.2.0/resources/motivation","siteSpaceId":"sitesp_5uxC0","emoji":"1f4a1","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"FEHY7dDBqo0nY0Dd9HNX","title":"Help","pathname":"/slm-lab/v5.2.0/resources/help","siteSpaceId":"sitesp_5uxC0","emoji":"2753","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"DkK3mgy6USFGhds3kWah","title":"Contact","pathname":"/slm-lab/v5.2.0/resources/contacts","siteSpaceId":"sitesp_5uxC0","emoji":"1f4e7","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"KvzlMaBt1DVv5XDXo6pp","title":"Changelog","pathname":"/slm-lab/v5.2.0/resources/changelog","siteSpaceId":"sitesp_5uxC0","emoji":"1f4dd","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"Tl0HufIrc0410HGN22kk","title":"SLM Lab","pathname":"/slm-lab","siteSpaceId":"sitesp_V9I9x","description":"Modular Deep Reinforcement Learning framework in PyTorch."},{"id":"f7Br137UPNMhryfR9pqo","title":"Installation","pathname":"/slm-lab/setup/installation","siteSpaceId":"sitesp_V9I9x","emoji":"1f4e6","description":"","breadcrumbs":[{"label":"Setup","emoji":"1f5a5"}]},{"id":"3XWoeghZsWx42Al1Kozq","title":"Quick Start","pathname":"/slm-lab/setup/quick-start","siteSpaceId":"sitesp_V9I9x","emoji":"26a1","description":"Test your installation with a quick demo.","breadcrumbs":[{"label":"Setup","emoji":"1f5a5"}]},{"id":"vr28q3cisIzC5vKgtaKE","title":"Train: PPO on CartPole","pathname":"/slm-lab/using-slm-lab/train-ppo-cartpole","siteSpaceId":"sitesp_V9I9x","emoji":"25b6","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"VySvxM0ro3fm6np0u8FG","title":"Resume and Replay","pathname":"/slm-lab/using-slm-lab/resume-and-replay","siteSpaceId":"sitesp_V9I9x","emoji":"1f504","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"T3LVQzSDktqCLN5HfgQE","title":"Core Concepts","pathname":"/slm-lab/using-slm-lab/lab-organization","siteSpaceId":"sitesp_V9I9x","emoji":"1f393","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"T8ZW3CbN9cUmNxrdtgIH","title":"Agent Spec","pathname":"/slm-lab/using-slm-lab/agent-spec-ddqn+per-on-lunarlander","siteSpaceId":"sitesp_V9I9x","emoji":"1f916","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"XA82YI31G7c6No4uHpUA","title":"Env Spec","pathname":"/slm-lab/using-slm-lab/environment-spec-a2c-on-bipedalwalker","siteSpaceId":"sitesp_V9I9x","emoji":"1f30d","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"wRxjV9G07fvocQxiKB78","title":"Meta Spec","pathname":"/slm-lab/using-slm-lab/meta-spec-high-level-specifications","siteSpaceId":"sitesp_V9I9x","emoji":"2699","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"opgbxg0Kmcy78TojKuzl","title":"Search Spec","pathname":"/slm-lab/using-slm-lab/search-spec-ppo-on-breakout","siteSpaceId":"sitesp_V9I9x","emoji":"1f50d","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"UnhCYB8IYhc1MXGuIfpG","title":"GPU Training","pathname":"/slm-lab/using-slm-lab/gpu-usage-ppo-on-pong","siteSpaceId":"sitesp_V9I9x","emoji":"1f3ae","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"jBujZ5VeSYTmF1Gl2FFz","title":"Remote Training","pathname":"/slm-lab/using-slm-lab/remote-training","siteSpaceId":"sitesp_V9I9x","emoji":"2601","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"zIAZJVpMISVBHt6xHNbv","title":"Async Training: Hogwild!","pathname":"/slm-lab/using-slm-lab/async-training-a3c-hogwild","siteSpaceId":"sitesp_V9I9x","emoji":"26a1","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"WWWhtS7mXaiVEBgvDh7Y","title":"Running Benchmarks","pathname":"/slm-lab/using-slm-lab/benchmark-specs","siteSpaceId":"sitesp_V9I9x","emoji":"1f4cb","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"GPfcZRZTxCQ5GT9Sj2YF","title":"CLI Reference","pathname":"/slm-lab/using-slm-lab/slm-lab-command","siteSpaceId":"sitesp_V9I9x","emoji":"1f4bb","description":"","breadcrumbs":[{"label":"Using SLM Lab","emoji":"1f680"}]},{"id":"SfAsuwWC0SXUFXrCinkY","title":"Data Locations","pathname":"/slm-lab/analyzing-results/analytics","siteSpaceId":"sitesp_V9I9x","emoji":"1f4c1","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"LaMgMtlKXnSA4MCJ60KF","title":"Graphs and Data","pathname":"/slm-lab/analyzing-results/session-graph","siteSpaceId":"sitesp_V9I9x","emoji":"1f4ca","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"1EhkpAOgKXVpzAo8TLiZ","title":"TensorBoard","pathname":"/slm-lab/analyzing-results/tensorboard-visualizing-models-and-actions","siteSpaceId":"sitesp_V9I9x","emoji":"1f4c9","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"JXKnbUEBZ0TsaXcuXzLW","title":"Performance Metrics","pathname":"/slm-lab/analyzing-results/performance-metrics","siteSpaceId":"sitesp_V9I9x","emoji":"1f3af","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"adDCRQqftZXuGWjQtT8y","title":"Post-Hoc Analysis","pathname":"/slm-lab/analyzing-results/post-hoc-analysis","siteSpaceId":"sitesp_V9I9x","emoji":"1f52c","description":"","breadcrumbs":[{"label":"Analyzing Results","emoji":"1f4c8"}]},{"id":"PikGaRButE5Q4Ohi3YQW","title":"Public Benchmark Data","pathname":"/slm-lab/benchmark-results/public-benchmark-data","siteSpaceId":"sitesp_V9I9x","emoji":"1f517","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"x417joK5oAnN4R62qoER","title":"Discrete Benchmark","pathname":"/slm-lab/benchmark-results/discrete-benchmark","siteSpaceId":"sitesp_V9I9x","emoji":"1f3af","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"LXAwXpoteoI2hwuhb0hE","title":"Continuous Benchmark","pathname":"/slm-lab/benchmark-results/continuous-benchmark","siteSpaceId":"sitesp_V9I9x","emoji":"1f3c3","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"3BzXxYtBUNjn6ISw6v2m","title":"Atari Benchmark","pathname":"/slm-lab/benchmark-results/atari-benchmark","siteSpaceId":"sitesp_V9I9x","emoji":"1f47e","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"8EqWW2WILbjU6NOf51cR","title":"Playground Benchmark","pathname":"/slm-lab/benchmark-results/playground-benchmark","siteSpaceId":"sitesp_V9I9x","emoji":"1f3ae","description":"","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"mFWqvFXDTJi6Nzlx9BGt","title":"RL GIFs","pathname":"/slm-lab/benchmark-results/rl-gifs","siteSpaceId":"sitesp_V9I9x","emoji":"1f3ac","description":"Trained agents in action—watch SLM Lab's PPO and SAC algorithms play games and control robots.","breadcrumbs":[{"label":"Benchmark Results","emoji":"1f947"}]},{"id":"x6VRlttMQeBBkMouLbPj","title":"Architecture","pathname":"/slm-lab/development/architecture","siteSpaceId":"sitesp_V9I9x","emoji":"1f3d7","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"jYSTBqMQ9bxCT8wDOBGx","title":"Modular Design","pathname":"/slm-lab/development/modular-lab-components","siteSpaceId":"sitesp_V9I9x","emoji":"1f9e9","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"wbwmpFPbuhsRY6b49bTx","title":"Algorithm Taxonomy","pathname":"/slm-lab/development/modular-lab-components/algorithm-taxonomy","siteSpaceId":"sitesp_V9I9x","emoji":"1f4da","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Modular Design","emoji":"1f9e9"}]},{"id":"00LbsA2KVSxUAUha8sWI","title":"Class Inheritance: A2C > PPO","pathname":"/slm-lab/development/modular-lab-components/class-inheritance-a2c-greater-than-ppo","siteSpaceId":"sitesp_V9I9x","emoji":"1f517","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Modular Design","emoji":"1f9e9"}]},{"id":"Q8FzkdPQOaW28d58gGE5","title":"Algorithm Families","pathname":"/slm-lab/development/algorithms","siteSpaceId":"sitesp_V9I9x","emoji":"1f9e0","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"GTtqmA3X8xo1js9mSbnB","title":"DQN","pathname":"/slm-lab/development/algorithms/dqn","siteSpaceId":"sitesp_V9I9x","emoji":"1f48e","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"}]},{"id":"oPmGE2PeVdq48QaO78tJ","title":"REINFORCE","pathname":"/slm-lab/development/algorithms/reinforce","siteSpaceId":"sitesp_V9I9x","emoji":"1f3b2","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"}]},{"id":"8RRVXw2AhR615Lx6YN3X","title":"Actor-Critic","pathname":"/slm-lab/development/algorithms/a2c","siteSpaceId":"sitesp_V9I9x","emoji":"1f3ad","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"}]},{"id":"kRSUiC7UHAPQIT8UYkOg","title":"PPO","pathname":"/slm-lab/development/algorithms/a2c/ppo","siteSpaceId":"sitesp_V9I9x","emoji":"1f535","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"},{"label":"Actor-Critic","emoji":"1f3ad"}]},{"id":"9rQiSoqbJs63rhqi8fF4","title":"SAC","pathname":"/slm-lab/development/algorithms/a2c/sac","siteSpaceId":"sitesp_V9I9x","emoji":"1f525","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"},{"label":"Actor-Critic","emoji":"1f3ad"}]},{"id":"bhNU8dRvcwIwjAQaanyJ","title":"CrossQ","pathname":"/slm-lab/development/algorithms/a2c/crossq","siteSpaceId":"sitesp_V9I9x","emoji":"26a1","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Algorithm Families","emoji":"1f9e0"},{"label":"Actor-Critic","emoji":"1f3ad"}]},{"id":"6R12Bz5wCYYmP47LLXPI","title":"Memory","pathname":"/slm-lab/development/memory","siteSpaceId":"sitesp_V9I9x","emoji":"1f4be","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"PZVequDSo1ZYYf2SziPT","title":"Replay","pathname":"/slm-lab/development/memory/replay","siteSpaceId":"sitesp_V9I9x","emoji":"1f504","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"KYjOW5bvTGYLvUvYitcl","title":"PrioritizedReplay","pathname":"/slm-lab/development/memory/prioritizedreplay","siteSpaceId":"sitesp_V9I9x","emoji":"2b50","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"7DyIvQG7mmnwVZTw0Oi1","title":"OnPolicyReplay","pathname":"/slm-lab/development/memory/onpolicyreplay","siteSpaceId":"sitesp_V9I9x","emoji":"1f4e4","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"YO2XkK531hT7uiTw8FIV","title":"OnPolicyBatchReplay","pathname":"/slm-lab/development/memory/onpolicybatchreplay","siteSpaceId":"sitesp_V9I9x","emoji":"1f4e6","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Memory","emoji":"1f4be"}]},{"id":"cZsdhIlX9ZkfHMVoLEdR","title":"Net","pathname":"/slm-lab/development/neural-networks","siteSpaceId":"sitesp_V9I9x","emoji":"1f9ec","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"C9Qba3qJepWSJMFyoyQv","title":"MLP","pathname":"/slm-lab/development/neural-networks/mlp","siteSpaceId":"sitesp_V9I9x","emoji":"1f522","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"E9TRTr4m0MaG7vyDIyOE","title":"CNN","pathname":"/slm-lab/development/neural-networks/cnn","siteSpaceId":"sitesp_V9I9x","emoji":"1f5bc","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"FqsKhgUuNp33d1XK0vXS","title":"RNN","pathname":"/slm-lab/development/neural-networks/rnn","siteSpaceId":"sitesp_V9I9x","emoji":"1f501","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"9eLXPkNRXSZT5IdnKK11","title":"TorchArc","pathname":"/slm-lab/development/neural-networks/torcharc","siteSpaceId":"sitesp_V9I9x","emoji":"1f4d0","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"},{"label":"Net","emoji":"1f9ec"}]},{"id":"qnPhApLxN4i9KapWxP1u","title":"Profiling SLM Lab","pathname":"/slm-lab/development/profiling-slm-lab","siteSpaceId":"sitesp_V9I9x","emoji":"23f1","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"b2HLY5aybtPDBndZMLZj","title":"Using SLM Lab In Your Project","pathname":"/slm-lab/development/using-slm-lab-in-your-project","siteSpaceId":"sitesp_V9I9x","emoji":"1f50c","description":"","breadcrumbs":[{"label":"Development","emoji":"1f527"}]},{"id":"rNxg6ItC5OGaPO41dG3r","title":"Book: Foundations of Deep RL","pathname":"/slm-lab/publications-and-talks/instruction-for-the-book-+-intro-to-rl-section","siteSpaceId":"sitesp_V9I9x","emoji":"1f4d5","description":"","breadcrumbs":[{"label":"Publications and Talks","emoji":"1f4d6"}]},{"id":"N3i0o9SWW1hHhzjr0f3K","title":"Talks and Presentations","pathname":"/slm-lab/publications-and-talks/talks-given-with-slm-lab","siteSpaceId":"sitesp_V9I9x","emoji":"1f3a4","description":"","breadcrumbs":[{"label":"Publications and Talks","emoji":"1f4d6"}]},{"id":"9sDxbU0ok69Jvrasym1q","title":"Deep RL Resources","pathname":"/slm-lab/resources/untitled","siteSpaceId":"sitesp_V9I9x","emoji":"1f4da","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"rvo7wAKEV5QFS4NOHjjt","title":"Contributing","pathname":"/slm-lab/resources/contributing","siteSpaceId":"sitesp_V9I9x","emoji":"1f91d","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"adqOzxyfxdE2322amLPl","title":"Code of Conduct","pathname":"/slm-lab/resources/code-of-conduct","siteSpaceId":"sitesp_V9I9x","emoji":"1f4dc","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"h6vH3D2M9vN2jX3VpViJ","title":"Motivation","pathname":"/slm-lab/resources/motivation","siteSpaceId":"sitesp_V9I9x","emoji":"1f4a1","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"1dHH0DLuasOUhlGf91q7","title":"Help","pathname":"/slm-lab/resources/help","siteSpaceId":"sitesp_V9I9x","emoji":"2753","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"MpJaFCFnO7KuI3gkFBi2","title":"Contact","pathname":"/slm-lab/resources/contacts","siteSpaceId":"sitesp_V9I9x","emoji":"1f4e7","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]},{"id":"KGq2sChvL4xgWmqfwkbo","title":"Changelog","pathname":"/slm-lab/resources/changelog","siteSpaceId":"sitesp_V9I9x","emoji":"1f4dd","description":"","breadcrumbs":[{"label":"Resources","emoji":"1f913"}]}]}