LICENSE
LICENSE.txt
README.md
setup.py
openrl/__init__.py
openrl.egg-info/PKG-INFO
openrl.egg-info/SOURCES.txt
openrl.egg-info/dependency_links.txt
openrl.egg-info/entry_points.txt
openrl.egg-info/requires.txt
openrl.egg-info/top_level.txt
openrl/algorithms/__init__.py
openrl/algorithms/base_algorithm.py
openrl/algorithms/dqn.py
openrl/algorithms/ppo.py
openrl/buffers/__init__.py
openrl/buffers/normal_buffer.py
openrl/buffers/offpolicy_buffer.py
openrl/buffers/offpolicy_replay_data.py
openrl/buffers/replay_data.py
openrl/buffers/utils/__init__.py
openrl/buffers/utils/obs_data.py
openrl/buffers/utils/util.py
openrl/cli/__init__.py
openrl/cli/cli.py
openrl/cli/train.py
openrl/configs/__init__.py
openrl/configs/config.py
openrl/drivers/__init__.py
openrl/drivers/base_driver.py
openrl/drivers/offpolicy_driver.py
openrl/drivers/onpolicy_driver.py
openrl/drivers/rl_driver.py
openrl/envs/__init__.py
openrl/envs/common/__init__.py
openrl/envs/common/build_envs.py
openrl/envs/common/registration.py
openrl/envs/gymnasium/__init__.py
openrl/envs/mpe/__init__.py
openrl/envs/mpe/core.py
openrl/envs/mpe/mpe_env.py
openrl/envs/mpe/multi_discrete.py
openrl/envs/mpe/multiagent_env.py
openrl/envs/mpe/rendering.py
openrl/envs/mpe/scenario.py
openrl/envs/mpe/scenarios/__init__.py
openrl/envs/mpe/scenarios/simple_spread.py
openrl/envs/nlp/__init__.py
openrl/envs/nlp/daily_dialog_env.py
openrl/envs/nlp/nlp_env.py
openrl/envs/nlp/utils/__init__.py
openrl/envs/nlp/utils/custom_text_generation_pools.py
openrl/envs/nlp/utils/distribution.py
openrl/envs/nlp/utils/evaluation_utils.py
openrl/envs/nlp/utils/observation.py
openrl/envs/nlp/utils/sampler.py
openrl/envs/nlp/utils/text_generation_pool.py
openrl/envs/nlp/utils/metrics/__init__.py
openrl/envs/nlp/utils/metrics/meteor.py
openrl/envs/super_mario/__init__.py
openrl/envs/super_mario/super_mario_convert.py
openrl/envs/vec_env/__init__.py
openrl/envs/vec_env/async_venv.py
openrl/envs/vec_env/base_venv.py
openrl/envs/vec_env/sync_venv.py
openrl/envs/vec_env/utils/__init__.py
openrl/envs/vec_env/utils/numpy_utils.py
openrl/envs/vec_env/utils/share_memory.py
openrl/envs/vec_env/utils/util.py
openrl/envs/vec_env/vec_info/__init__.py
openrl/envs/vec_env/vec_info/base_vec_info.py
openrl/envs/vec_env/vec_info/nlp_vec_info.py
openrl/envs/vec_env/vec_info/simple_vec_info.py
openrl/envs/vec_env/wrappers/__init__.py
openrl/envs/vec_env/wrappers/base_wrapper.py
openrl/envs/vec_env/wrappers/reward_wrapper.py
openrl/envs/vec_env/wrappers/vec_monitor_wrapper.py
openrl/envs/wrappers/__init__.py
openrl/envs/wrappers/base_wrapper.py
openrl/envs/wrappers/extra_wrappers.py
openrl/envs/wrappers/multiagent_wrapper.py
openrl/envs/wrappers/util.py
openrl/modules/__init__.py
openrl/modules/base_module.py
openrl/modules/dqn_module.py
openrl/modules/model_config.py
openrl/modules/ppo_module.py
openrl/modules/rl_module.py
openrl/modules/common/__init__.py
openrl/modules/common/base_net.py
openrl/modules/common/dqn_net.py
openrl/modules/common/ppo_net.py
openrl/modules/networks/__init__.py
openrl/modules/networks/base_policy_network.py
openrl/modules/networks/base_value_network.py
openrl/modules/networks/policy_network.py
openrl/modules/networks/policy_value_network.py
openrl/modules/networks/policy_value_network_gpt.py
openrl/modules/networks/q_network.py
openrl/modules/networks/value_network.py
openrl/modules/networks/utils/__init__.py
openrl/modules/networks/utils/act.py
openrl/modules/networks/utils/attention.py
openrl/modules/networks/utils/cnn.py
openrl/modules/networks/utils/distributed_utils.py
openrl/modules/networks/utils/distributions.py
openrl/modules/networks/utils/mix.py
openrl/modules/networks/utils/mlp.py
openrl/modules/networks/utils/popart.py
openrl/modules/networks/utils/rnn.py
openrl/modules/networks/utils/transformer_act.py
openrl/modules/networks/utils/util.py
openrl/modules/networks/utils/nlp/__init__.py
openrl/modules/networks/utils/nlp/base_policy.py
openrl/modules/networks/utils/nlp/causal_policy.py
openrl/modules/networks/utils/nlp/hf_generation_utils.py
openrl/modules/utils/__init__.py
openrl/modules/utils/util.py
openrl/modules/utils/valuenorm.py
openrl/rewards/__init__.py
openrl/rewards/base_reward.py
openrl/rewards/nlp_reward.py
openrl/runners/__init__.py
openrl/runners/common/__init__.py
openrl/runners/common/base_agent.py
openrl/runners/common/chat_agent.py
openrl/runners/common/dqn_agent.py
openrl/runners/common/ppo_agent.py
openrl/runners/common/rl_agent.py
openrl/supports/__init__.py
openrl/supports/opendata/__init__.py
openrl/supports/opendata/utils/__init__.py
openrl/supports/opendata/utils/opendata_utils.py
openrl/supports/opengpu/__init__.py
openrl/supports/opengpu/gpu_info.py
openrl/supports/opengpu/manager.py
openrl/utils/__init__.py
openrl/utils/logger.py
openrl/utils/util.py
tests/__init__.py
tests/project/__init__.py
tests/project/test_version.py
tests/test_buffer/__init__.py
tests/test_buffer/test_buffer.py