├── README.md ├── agents ├── __init__.py ├── __pycache__ │ ├── __init__.cpython-35.pyc │ └── __init__.cpython-37.pyc ├── common │ ├── __init__.py │ ├── __pycache__ │ │ ├── __init__.cpython-35.pyc │ │ ├── __init__.cpython-37.pyc │ │ ├── common.cpython-35.pyc │ │ ├── common_cpr.cpython-35.pyc │ │ ├── common_ddpg.cpython-35.pyc │ │ ├── common_dqn.cpython-35.pyc │ │ ├── common_msbcb.cpython-35.pyc │ │ ├── common_msbcb.cpython-37.pyc │ │ └── common_ppo.cpython-35.pyc │ ├── common.py │ ├── common_cpr.py │ ├── common_ddpg.py │ ├── common_dqn.py │ ├── common_msbcb.py │ └── common_ppo.py ├── constrained_ddpg.py ├── constrained_dqn.py ├── constrained_ppo.py ├── contextual_bandit.py ├── greedy_with_ddpg.py ├── greedy_with_dqn.py ├── greedy_with_max_cpr.py ├── greedy_with_ppo.py ├── msbcb.py └── offline_optimal.py ├── figures_for_paper ├── .DS_Store ├── __init__.py ├── figures.py └── figures_appendix.py ├── plot_util ├── __init__.py ├── __pycache__ │ ├── __init__.cpython-35.pyc │ └── tf_log.cpython-35.pyc └── tf_log.py ├── replay_buffer ├── __init__.py ├── __pycache__ │ ├── __init__.cpython-35.pyc │ ├── bid_replay_buffer.cpython-35.pyc │ ├── replay_buffer.cpython-35.pyc │ ├── segment_tree.cpython-35.pyc │ └── utils.cpython-35.pyc ├── bid_replay_buffer.py ├── priority_queue_buffer.py ├── replay_buffer.py ├── segment_tree.py ├── trajectory_replay_buffer.py └── utils.py ├── requirements.txt └── simulation_env ├── __init__.py ├── __pycache__ ├── __init__.cpython-35.pyc ├── __init__.cpython-36.pyc ├── multiuser_env.cpython-35.pyc ├── multiuser_env_cmdp.cpython-35.pyc ├── multiuser_env_cmdp.cpython-36.pyc └── utils.cpython-35.pyc ├── multiuser_env.py ├── multiuser_env_cmdp.py ├── multiuser_env_v0.py └── utils.py /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/README.md -------------------------------------------------------------------------------- /agents/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /agents/__pycache__/__init__.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/__pycache__/__init__.cpython-35.pyc -------------------------------------------------------------------------------- /agents/__pycache__/__init__.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/__pycache__/__init__.cpython-37.pyc -------------------------------------------------------------------------------- /agents/common/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /agents/common/__pycache__/__init__.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/__pycache__/__init__.cpython-35.pyc -------------------------------------------------------------------------------- /agents/common/__pycache__/__init__.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/__pycache__/__init__.cpython-37.pyc -------------------------------------------------------------------------------- /agents/common/__pycache__/common.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/__pycache__/common.cpython-35.pyc -------------------------------------------------------------------------------- /agents/common/__pycache__/common_cpr.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/__pycache__/common_cpr.cpython-35.pyc -------------------------------------------------------------------------------- /agents/common/__pycache__/common_ddpg.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/__pycache__/common_ddpg.cpython-35.pyc -------------------------------------------------------------------------------- /agents/common/__pycache__/common_dqn.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/__pycache__/common_dqn.cpython-35.pyc -------------------------------------------------------------------------------- /agents/common/__pycache__/common_msbcb.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/__pycache__/common_msbcb.cpython-35.pyc -------------------------------------------------------------------------------- /agents/common/__pycache__/common_msbcb.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/__pycache__/common_msbcb.cpython-37.pyc -------------------------------------------------------------------------------- /agents/common/__pycache__/common_ppo.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/__pycache__/common_ppo.cpython-35.pyc -------------------------------------------------------------------------------- /agents/common/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/common.py -------------------------------------------------------------------------------- /agents/common/common_cpr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/common_cpr.py -------------------------------------------------------------------------------- /agents/common/common_ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/common_ddpg.py -------------------------------------------------------------------------------- /agents/common/common_dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/common_dqn.py -------------------------------------------------------------------------------- /agents/common/common_msbcb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/common_msbcb.py -------------------------------------------------------------------------------- /agents/common/common_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/common/common_ppo.py -------------------------------------------------------------------------------- /agents/constrained_ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/constrained_ddpg.py -------------------------------------------------------------------------------- /agents/constrained_dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/constrained_dqn.py -------------------------------------------------------------------------------- /agents/constrained_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/constrained_ppo.py -------------------------------------------------------------------------------- /agents/contextual_bandit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/contextual_bandit.py -------------------------------------------------------------------------------- /agents/greedy_with_ddpg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/greedy_with_ddpg.py -------------------------------------------------------------------------------- /agents/greedy_with_dqn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/greedy_with_dqn.py -------------------------------------------------------------------------------- /agents/greedy_with_max_cpr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/greedy_with_max_cpr.py -------------------------------------------------------------------------------- /agents/greedy_with_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/greedy_with_ppo.py -------------------------------------------------------------------------------- /agents/msbcb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/msbcb.py -------------------------------------------------------------------------------- /agents/offline_optimal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/agents/offline_optimal.py -------------------------------------------------------------------------------- /figures_for_paper/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/figures_for_paper/.DS_Store -------------------------------------------------------------------------------- /figures_for_paper/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /figures_for_paper/figures.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/figures_for_paper/figures.py -------------------------------------------------------------------------------- /figures_for_paper/figures_appendix.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/figures_for_paper/figures_appendix.py -------------------------------------------------------------------------------- /plot_util/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /plot_util/__pycache__/__init__.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/plot_util/__pycache__/__init__.cpython-35.pyc -------------------------------------------------------------------------------- /plot_util/__pycache__/tf_log.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/plot_util/__pycache__/tf_log.cpython-35.pyc -------------------------------------------------------------------------------- /plot_util/tf_log.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/plot_util/tf_log.py -------------------------------------------------------------------------------- /replay_buffer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /replay_buffer/__pycache__/__init__.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/replay_buffer/__pycache__/__init__.cpython-35.pyc -------------------------------------------------------------------------------- /replay_buffer/__pycache__/bid_replay_buffer.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/replay_buffer/__pycache__/bid_replay_buffer.cpython-35.pyc -------------------------------------------------------------------------------- /replay_buffer/__pycache__/replay_buffer.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/replay_buffer/__pycache__/replay_buffer.cpython-35.pyc -------------------------------------------------------------------------------- /replay_buffer/__pycache__/segment_tree.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/replay_buffer/__pycache__/segment_tree.cpython-35.pyc -------------------------------------------------------------------------------- /replay_buffer/__pycache__/utils.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/replay_buffer/__pycache__/utils.cpython-35.pyc -------------------------------------------------------------------------------- /replay_buffer/bid_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/replay_buffer/bid_replay_buffer.py -------------------------------------------------------------------------------- /replay_buffer/priority_queue_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/replay_buffer/priority_queue_buffer.py -------------------------------------------------------------------------------- /replay_buffer/replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/replay_buffer/replay_buffer.py -------------------------------------------------------------------------------- /replay_buffer/segment_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/replay_buffer/segment_tree.py -------------------------------------------------------------------------------- /replay_buffer/trajectory_replay_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/replay_buffer/trajectory_replay_buffer.py -------------------------------------------------------------------------------- /replay_buffer/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/replay_buffer/utils.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/requirements.txt -------------------------------------------------------------------------------- /simulation_env/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /simulation_env/__pycache__/__init__.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/simulation_env/__pycache__/__init__.cpython-35.pyc -------------------------------------------------------------------------------- /simulation_env/__pycache__/__init__.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/simulation_env/__pycache__/__init__.cpython-36.pyc -------------------------------------------------------------------------------- /simulation_env/__pycache__/multiuser_env.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/simulation_env/__pycache__/multiuser_env.cpython-35.pyc -------------------------------------------------------------------------------- /simulation_env/__pycache__/multiuser_env_cmdp.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/simulation_env/__pycache__/multiuser_env_cmdp.cpython-35.pyc -------------------------------------------------------------------------------- /simulation_env/__pycache__/multiuser_env_cmdp.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/simulation_env/__pycache__/multiuser_env_cmdp.cpython-36.pyc -------------------------------------------------------------------------------- /simulation_env/__pycache__/utils.cpython-35.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/simulation_env/__pycache__/utils.cpython-35.pyc -------------------------------------------------------------------------------- /simulation_env/multiuser_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/simulation_env/multiuser_env.py -------------------------------------------------------------------------------- /simulation_env/multiuser_env_cmdp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/simulation_env/multiuser_env_cmdp.py -------------------------------------------------------------------------------- /simulation_env/multiuser_env_v0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/simulation_env/multiuser_env_v0.py -------------------------------------------------------------------------------- /simulation_env/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tjuHaoXiaotian/ICML-2020-MSBCB/HEAD/simulation_env/utils.py --------------------------------------------------------------------------------