salil-malhotra
commited on
Commit
·
8042e00
1
Parent(s):
963ca6d
Upload PPO LunarLander-v2 trained agent
Browse files- README.md +2 -1
- config.json +1 -1
- ppo-LunarLander-v2.zip +2 -2
- ppo-LunarLander-v2/data +24 -24
- ppo-LunarLander-v2/policy.optimizer.pth +1 -1
- ppo-LunarLander-v2/policy.pth +1 -1
- replay.mp4 +0 -0
- results.json +1 -1
README.md
CHANGED
@@ -10,7 +10,7 @@ model-index:
|
|
10 |
results:
|
11 |
- metrics:
|
12 |
- type: mean_reward
|
13 |
-
value:
|
14 |
name: mean_reward
|
15 |
task:
|
16 |
type: reinforcement-learning
|
@@ -24,6 +24,7 @@ model-index:
|
|
24 |
|
25 |
|
26 |
|
|
|
27 |
# **PPO** Agent playing **LunarLander-v2**
|
28 |
This is a trained model of a **PPO** agent playing **LunarLander-v2** using the [stable-baselines3 library](https://github.com/DLR-RM/stable-baselines3).
|
29 |
|
|
|
10 |
results:
|
11 |
- metrics:
|
12 |
- type: mean_reward
|
13 |
+
value: 270.94 +/- 27.90
|
14 |
name: mean_reward
|
15 |
task:
|
16 |
type: reinforcement-learning
|
|
|
24 |
|
25 |
|
26 |
|
27 |
+
|
28 |
# **PPO** Agent playing **LunarLander-v2**
|
29 |
This is a trained model of a **PPO** agent playing **LunarLander-v2** using the [stable-baselines3 library](https://github.com/DLR-RM/stable-baselines3).
|
30 |
|
config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x0000012B49ED34C0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x0000012B49ED3550>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x0000012B49ED35E0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x0000012B49ED3670>", "_build": "<function ActorCriticPolicy._build at 0x0000012B49ED3700>", "forward": "<function ActorCriticPolicy.forward at 0x0000012B49ED3790>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x0000012B49ED3820>", "_predict": "<function ActorCriticPolicy._predict at 0x0000012B49ED38B0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x0000012B49ED3940>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x0000012B49ED39D0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x0000012B49ED3A60>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x0000012B49ED2180>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVngEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBXNoYXBllEsIhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAAAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSwiFlIwBQ5R0lFKUjARoaWdolGgSKJYgAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/lGgKSwiFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWCAAAAAAAAAAAAAAAAAAAAJRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZRoFXSUUpSMDWJvdW5kZWRfYWJvdmWUaBIolggAAAAAAAAAAAAAAAAAAACUaCFLCIWUaBV0lFKUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVgQAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwFc2hhcGWUKYwFZHR5cGWUjAVudW1weZRoB5OUjAJpOJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRijApfbnBfcmFuZG9tlE51Yi4=", "n": 4, "shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 524288, "_total_timesteps": 500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652212264.8089247, "learning_rate": 0.0003, "tensorboard_log": "tmp/", "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVkQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGFDOlxVc2Vyc1xtYWxoc2FsXGRldlxkYmNvbmRhLTIwMjFfMDUtcHkzOC1yMzZcbGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flGgNdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBdoDowMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBiMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAALOx5r24vtY4GRwAvAz1QLydPtS61zexOwAAAAAAAAAAAFATPSmMbjkLUom8rCgJPe20sbrLBWq8AAAAAAAAgD+aXNs85IG2PtUmUL7dYI6+psmkPNatpr0AAAAAAAAAAJrMobwUvI266Io8PDsyHrXEYai6vtERtAAAgD8AAIA/ZjB2vQoXPjjNmjq8MMHBPHT4FrpZXxi8AACAPwAAgD+aBZq8uNbwuaiZ+Trfp6C1ge4LOls0n7QAAIA/AACAP2ZFGz09Og65veuNu7ul0rTICLU7X3lJNAAAgD8AAIA/ihTIvhkAEj/WYlU+w7Gavgx6Tb67LVA+AAAAAAAAAACa06a8KTBHumoTnbq8KL+01sDCus+QtzkAAIA/AACAP6BLCL7DkUa6/f5tOnsLOzh9xuE7L2AyuQAAgD8AAIA/mpcfvPLqAD5Aa+M8sA8gvrPTDD0zJDI9AAAAAAAAAACaFwo8KUAxurMyObrsCXi4hR/5ucqOYDkAAIA/AACAPzMDS7yP3km69EeoPEWF0bjD7127s2rOtwAAgD8AAIA/mgXVPcNpGTtx3QG+mcttvpCDAL0EeRA9AAAAAAAAAAATfQ6+7LW1u+4ipbvggtm5dkoNPauHuDoAAIA/AACAPwBsizuu+ZK63+ZKutOYL7VBadW6RftqOQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.04857599999999995, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVfRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIpfW3BOD0WUCUhpRSlIwBbJRN6AOMAXSUR0CmDbwC8vmHdX2UKGgGaAloD0MIrfpcbcUSYECUhpRSlGgVTegDaBZHQKYOpJYkmhN1fZQoaAZoCWgPQwg2yY/4FXdRQJSGlFKUaBVN6ANoFkdApg/oGyHEdnV9lChoBmgJaA9DCIxIFFrWKF1AlIaUUpRoFU3oA2gWR0CmEbMunMt9dX2UKGgGaAloD0MI/YUeMXoxZUCUhpRSlGgVTegDaBZHQKYUv+85CF91fZQoaAZoCWgPQwggmQ6dnlBZQJSGlFKUaBVN6ANoFkdAphfm/QBxP3V9lChoBmgJaA9DCGk7pu7KKlxAlIaUUpRoFU3oA2gWR0CmGKN5D7ZWdX2UKGgGaAloD0MIVvXyO00KYECUhpRSlGgVTegDaBZHQKYZtKT0QK91fZQoaAZoCWgPQwh6ihwi7kZgQJSGlFKUaBVN6ANoFkdAphm10HQhOnV9lChoBmgJaA9DCAbaHVIMYlRAlIaUUpRoFU3oA2gWR0CmGqqx9oexdX2UKGgGaAloD0MI1F+vsODAYECUhpRSlGgVTegDaBZHQKYc83eenQ91fZQoaAZoCWgPQwgKhnMNMwFcQJSGlFKUaBVN6ANoFkdAph5OcriEQHV9lChoBmgJaA9DCD24O2u3d1dAlIaUUpRoFU3oA2gWR0CmHyRaxHG0dX2UKGgGaAloD0MI+UhKehg4TUCUhpRSlGgVS8hoFkdApiAIv8IiT3V9lChoBmgJaA9DCLFuvDsyvltAlIaUUpRoFU3oA2gWR0CmICxLCemOdX2UKGgGaAloD0MI16axvRa8XkCUhpRSlGgVTegDaBZHQKYjGEq2Brh1fZQoaAZoCWgPQwhPP6iLFJZkQJSGlFKUaBVN6ANoFkdApiP7awljVnV9lChoBmgJaA9DCHV4COMnRmJAlIaUUpRoFU3oA2gWR0CmM1DaGpMpdX2UKGgGaAloD0MIHvmDgeflWUCUhpRSlGgVTegDaBZHQKY0OW0qpcZ1fZQoaAZoCWgPQwiNKO0Nvm5fQJSGlFKUaBVN6ANoFkdApjVXtY0VJ3V9lChoBmgJaA9DCLTHC+nwqGBAlIaUUpRoFU3oA2gWR0CmNxmvOhTPdX2UKGgGaAloD0MIDvPlBVjRYECUhpRSlGgVTegDaBZHQKY6oBDohZB1fZQoaAZoCWgPQwgR34lZL2BgQJSGlFKUaBVN6ANoFkdApj2X5ckdFXV9lChoBmgJaA9DCDF5A8x851tAlIaUUpRoFU3oA2gWR0CmP6sMRYigdX2UKGgGaAloD0MId6BOeXTzXECUhpRSlGgVTegDaBZHQKY/rLpzLfV1fZQoaAZoCWgPQwgYd4NorahTQJSGlFKUaBVN6ANoFkdApkB/c32mHnV9lChoBmgJaA9DCPUsCOV9bV9AlIaUUpRoFU3oA2gWR0CmQmEUCaJAdX2UKGgGaAloD0MInkSEfxGUVkCUhpRSlGgVTegDaBZHQKZDbqUNayN1fZQoaAZoCWgPQwiaCYZzjVJhQJSGlFKUaBVN6ANoFkdApkQs0FbFCXV9lChoBmgJaA9DCNSAQdKnNV1AlIaUUpRoFU3oA2gWR0CmRSkXcgyNdX2UKGgGaAloD0MIttlYiXnQW0CUhpRSlGgVTegDaBZHQKZFUWiUPhB1fZQoaAZoCWgPQwjYDkbsEyJZQJSGlFKUaBVN6ANoFkdApkg5p5/smnV9lChoBmgJaA9DCGvY74l1oF5AlIaUUpRoFU3oA2gWR0CmSQ1aW5YpdX2UKGgGaAloD0MIqS9LO7U3YUCUhpRSlGgVTegDaBZHQKZ1y9B8hLZ1fZQoaAZoCWgPQwgGgCpu3HBWQJSGlFKUaBVN6ANoFkdApnacZNwiq3V9lChoBmgJaA9DCMqJdhVSKF5AlIaUUpRoFU3oA2gWR0Cmd6quSwGGdX2UKGgGaAloD0MIWwcHexNDYUCUhpRSlGgVTegDaBZHQKZ5NcWTHKh1fZQoaAZoCWgPQwgTmiSWFHxjQJSGlFKUaBVN6ANoFkdApnv0JdB0IXV9lChoBmgJaA9DCIZxN4jWz2JAlIaUUpRoFU3oA2gWR0CmfqGUwBYFdX2UKGgGaAloD0MI78ouGFzZYkCUhpRSlGgVTegDaBZHQKaAQm3vx6R1fZQoaAZoCWgPQwhSDJBogixgQJSGlFKUaBVN6ANoFkdApoBDmW+oL3V9lChoBmgJaA9DCAH8U6pEo19AlIaUUpRoFU3oA2gWR0CmgRoRAbADdX2UKGgGaAloD0MIv7m/etxSX0CUhpRSlGgVTegDaBZHQKaDHjENvwV1fZQoaAZoCWgPQwgtYAK3btpgQJSGlFKUaBVN6ANoFkdApoRP9UCJXXV9lChoBmgJaA9DCNfZkH/ms2FAlIaUUpRoFU3oA2gWR0CmhSyjQAuJdX2UKGgGaAloD0MIxJPdzOgrXECUhpRSlGgVTegDaBZHQKaGN4M4LkV1fZQoaAZoCWgPQwi6FcJqrGtjQJSGlFKUaBVN6ANoFkdApoZZkTYdyXV9lChoBmgJaA9DCOY7+ImDXmRAlIaUUpRoFU3oA2gWR0CmiOKSPluFdX2UKGgGaAloD0MIx9XIrrRSXUCUhpRSlGgVTegDaBZHQKaJsn4wh4d1fZQoaAZoCWgPQwh4Qq8/iUlbQJSGlFKUaBVN6ANoFkdAppfGVRk3CXV9lChoBmgJaA9DCNP58CxB1GBAlIaUUpRoFU3oA2gWR0CmmKRR/EwWdX2UKGgGaAloD0MIAyLElbMCWUCUhpRSlGgVTegDaBZHQKaZsJ3PiUB1fZQoaAZoCWgPQwizKOyiaANgQJSGlFKUaBVN6ANoFkdApps4xzq8lHV9lChoBmgJaA9DCNO+ub96mGVAlIaUUpRoFU3oA2gWR0CmnfUZWJaadX2UKGgGaAloD0MI6glLPKDQY0CUhpRSlGgVTegDaBZHQKagSuloDgZ1fZQoaAZoCWgPQwi6FcJqLEEGwJSGlFKUaBVL0WgWR0CmoJcVgx8EdX2UKGgGaAloD0MI1uHoKl0lYUCUhpRSlGgVTegDaBZHQKah5DWsijd1fZQoaAZoCWgPQwhN9zqpL5RcQJSGlFKUaBVN6ANoFkdApqHjVjI7vHV9lChoBmgJaA9DCMOedvjrd2BAlIaUUpRoFU3oA2gWR0CmootIK+i8dX2UKGgGaAloD0MIo1aYvtcgZkCUhpRSlGgVTegDaBZHQKakEyOaOPx1fZQoaAZoCWgPQwiWW1oNifRjQJSGlFKUaBVN6ANoFkdApqULlLeyiXV9lChoBmgJaA9DCDjYmxgSWGRAlIaUUpRoFU3oA2gWR0CmpaD0L+gldX2UKGgGaAloD0MIg/jAjv/tX0CUhpRSlGgVTegDaBZHQKamb/CIk7h1fZQoaAZoCWgPQwhT6pJxjJRVQJSGlFKUaBVN6ANoFkdApqaTd+G47XV9lChoBmgJaA9DCBAlWvJ4iWBAlIaUUpRoFU3oA2gWR0CmqNxy4nWrdX2UKGgGaAloD0MIdArys5HAXUCUhpRSlGgVTegDaBZHQKapuCwr1/V1fZQoaAZoCWgPQwg+l6lJ8NhdQJSGlFKUaBVN6ANoFkdApthr2+PBBXV9lChoBmgJaA9DCNvAHahTXmBAlIaUUpRoFU3oA2gWR0Cm2UfhuO0cdX2UKGgGaAloD0MIr1sExvoUXUCUhpRSlGgVTegDaBZHQKbb4/tY0VJ1fZQoaAZoCWgPQwjex9EcWYBgQJSGlFKUaBVN6ANoFkdApt8TxZuAJHV9lChoBmgJaA9DCOs1PSgoDWZAlIaUUpRoFU3oA2gWR0Cm4c9Q40djdX2UKGgGaAloD0MI/Ul87gQ3WkCUhpRSlGgVTegDaBZHQKbiKExIre91fZQoaAZoCWgPQwiUFFgA06NhQJSGlFKUaBVN6ANoFkdApuNlwvQF93V9lChoBmgJaA9DCCdnKO74emRAlIaUUpRoFU3oA2gWR0Cm42dxIatLdX2UKGgGaAloD0MIgBDJkOM4ZECUhpRSlGgVTegDaBZHQKbkRHkLhJl1fZQoaAZoCWgPQwgGSDSBom9hQJSGlFKUaBVN6ANoFkdApuZaBshxHXV9lChoBmgJaA9DCAx3Loz0tV1AlIaUUpRoFU3oA2gWR0Cm52sH8jzJdX2UKGgGaAloD0MIweCaO/rJWUCUhpRSlGgVTegDaBZHQKboGZML4N91fZQoaAZoCWgPQwhyNbIrLRVgQJSGlFKUaBVN6ANoFkdApujMhA4XGnV9lChoBmgJaA9DCG6/fLJicFRAlIaUUpRoFU3oA2gWR0Cm6OP3rUsndX2UKGgGaAloD0MIv5gtWZV/Y0CUhpRSlGgVTegDaBZHQKbrIe3hGYt1fZQoaAZoCWgPQwgv/OB86kVlQJSGlFKUaBVN6ANoFkdApuvamKqGUXV9lChoBmgJaA9DCMmOjUA8SHBAlIaUUpRoFU00AmgWR0Cm8iWWY4Q0dX2UKGgGaAloD0MIxAjh0cbvYkCUhpRSlGgVTegDaBZHQKb4qn2qT8p1fZQoaAZoCWgPQwgclZuoJdZjQJSGlFKUaBVN6ANoFkdApvmAlIEr5XV9lChoBmgJaA9DCAUWwJSBdGVAlIaUUpRoFU3oA2gWR0Cm+/xY7q6fdX2UKGgGaAloD0MIXJIDdjV4W0CUhpRSlGgVTegDaBZHQKb+72dNFjN1fZQoaAZoCWgPQwgJwD+lSlJeQJSGlFKUaBVN6ANoFkdApwHWzposZ3V9lChoBmgJaA9DCLJIE++Ah2JAlIaUUpRoFU3oA2gWR0CnAybDEWIodX2UKGgGaAloD0MI+YIWErAdYECUhpRSlGgVTegDaBZHQKcDJ+6RQrN1fZQoaAZoCWgPQwisxDwr6V9lQJSGlFKUaBVN6ANoFkdApwPWEIw/PnV9lChoBmgJaA9DCOJ1/YLdOVhAlIaUUpRoFU3oA2gWR0CnBblaKUFCdX2UKGgGaAloD0MI2/eov15kWkCUhpRSlGgVTegDaBZHQKcG117pmmN1fZQoaAZoCWgPQwikN9xHbjBhQJSGlFKUaBVN6ANoFkdApwd3Td+G5HV9lChoBmgJaA9DCCSZ1Tvcz2FAlIaUUpRoFU3oA2gWR0CnCE6k690zdX2UKGgGaAloD0MISIld21tjYkCUhpRSlGgVTegDaBZHQKcIdehPCVN1fZQoaAZoCWgPQwiunSgJiWZCQJSGlFKUaBVL4mgWR0CnCaNA1NxmdX2UKGgGaAloD0MIWcLaGDvTTUCUhpRSlGgVS+poFkdApwnSXpnpS3V9lChoBmgJaA9DCJHRAUnY8mJAlIaUUpRoFU3oA2gWR0CnCroMrmQsdX2UKGgGaAloD0MIgPEMGvq7YUCUhpRSlGgVTegDaBZHQKcLbS/CZWt1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 128, "n_steps": 2048, "gamma": 0.998, "gae_lambda": 0.97, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 8, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVkQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGFDOlxVc2Vyc1xtYWxoc2FsXGRldlxkYmNvbmRhLTIwMjFfMDUtcHkzOC1yMzZcbGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flGgNdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBdoDowMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBiMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "target_kl": null, "system_info": {"OS": "Windows-10-10.0.18362-SP0 10.0.18362", "Python": "3.8.8", "Stable-Baselines3": "1.4.0", "PyTorch": "1.11.0", "GPU Enabled": "False", "Numpy": "1.20.1", "Gym": "0.19.0"}}
|
|
|
1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x0000021F61AE31F0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x0000021F61AE3280>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x0000021F61AE3310>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x0000021F61AE33A0>", "_build": "<function ActorCriticPolicy._build at 0x0000021F61AE3430>", "forward": "<function ActorCriticPolicy.forward at 0x0000021F61AE34C0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x0000021F61AE3550>", "_predict": "<function ActorCriticPolicy._predict at 0x0000021F61AE35E0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x0000021F61AE3670>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x0000021F61AE3700>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x0000021F61AE3790>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x0000021F61AD8D20>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVJQwAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBXNoYXBllEsIhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAAAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSwiFlIwBQ5R0lFKUjARoaWdolGgSKJYgAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/lGgKSwiFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWCAAAAAAAAAAAAAAAAAAAAJRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZRoFXSUUpSMDWJvdW5kZWRfYWJvdmWUaBIolggAAAAAAAAAAAAAAAAAAACUaCFLCIWUaBV0lFKUjApfbnBfcmFuZG9tlIwUbnVtcHkucmFuZG9tLl9waWNrbGWUjBJfX3JhbmRvbXN0YXRlX2N0b3KUk5SMB01UMTk5MzeUhZRSlH2UKIwNYml0X2dlbmVyYXRvcpRoMIwFc3RhdGWUfZQojANrZXmUaBIolsAJAAAAAAAAgIYUuA51sC9/GaBAogWdT4aqPn/BNJuTKl5lpSyWTe5iRbx8HC1lKMMgblSSrAaw2HUGsWL9dmmoeM1BusXYG7L0gga0EfncHTzE7o1dUgaUmtTfIu7urWTopXFtXLBY9SvG/n/RpeNcI70bjcq1vSVxue5Y97vURA12iLkLbbOrytk+SV42OVyxK8Pra+XeXX6APZXhdnpndSAh4I2JY/bQm33sXarpzVnDSvZX/1bO2S1t0p4mnFjmNAGC+TSTF0905Tg3RGVC4X6b6pD+UOLvKsAdeZ/5N8089fxJCLB/y7nPUk69iNihFvS99x9ki+wfYa38Rld/eF/xkNKfEzWoefsnDtWYDa0WrM2lwDux10HFpl9Wh0lGoDFu1tnGPZRnLYTX6MZ3KMGqZuaDcvYcZCfyKJ3VdNBMAJyTlKJ5giNx+9jRCil5opqfYSPSGInrOmCTtSasF8jQ6WHel8aguaLOlUomQ18hWPI4g8BYkn62+SU+usK+Wi27JlaUfdUQOe/TjZTkGkf0NZYXEoPcPcG94iy72DeKsq+lec6S5KXsvWSI3JflabUmyvh1o9WgHBoYYzPjmHCJ/zncyHbKc1+qG1Ad7XzEZLcUeasdqtsThYpX4Pu29CmzmKoQuaAxhFo4ZLXbt3SCMzxPkFR4WDFaUE/ZervcfjHx53KWrnjCA4F6ncA8FUXJYIErKYajOoMrqbedPs7ZbDepmRvPCUP/t7We0iFj1vw2FGKsjdf0OeNwbHdibbiop1B2iJytURXxxYmz1F1RIyEiwUX20PC908fEVdxJW8oO9gyXgcV+UWfu0CuNpDw7sEoFt81oo6pQe2yNFyun8JA4xK1Bq14sK/d92MAiMLdOEz8CwCf3L2ZIy02r6Az9hRBJuFVaz727HjSBhdMgn6p7Xr2lNOQBBoo+3BdlrJIW0ZstmBCMhDRns0QvUHMzrMrhPYE4dQsPMF+sxbF2Dx+MZdauzWlbcdVrdTN9d2UN0c2BBDUx6lFJ3sRZfEHLJ7OkppCs/bAyjrfHI/7sG4YvO4ZOPxrL3Y/S2KW3sIKRdvldi43SPunKhL4nktEAmKDvxP9WdP/v66LPSrUzjN5tswmHjKuUZw/avRXO3RIFBBHtEGbRqRU6RQD15DLZft0HwyfVZwN9CZ1cXarOOCQrPPn28h7KTHujKCTYg0MnWBlC9S/6XNVxNZhbIbnR4aH6a+WCrlwFn2qeDzA1pcyrxM/teWS2s1l3Y9xiXpyzjaVUJEiGtXV9BEmEstjzF+d/0EAAG2LEUW/mbxx/R43ms9HJcBeYz3ixvSNzXVerz3RT557h9g9lox5PuVWAP4aZbYE4y3+LkGQFjwea2FE68RXWjslWeyrRUlirXhMNV8/jGB9UtJgFLva7Y99573/FZ1M9R4JWxQvveKN2sp4+vON6/tKv+C2n+oYH8jJquQeFA3sWMKMS4fCbXoH+4lhkd6ktywESpdChW8eC7ScUe9v2VUwauFQtBKgCznvUBw9tfMJGTj7xfneeILl6XuUxjeyE/8PHrHcU1tVws72T9azGKjd+TgYoKiL5/+hbuQqtEWJ775Xi7oB0Fk7zwP4B3Mq08+n84Xmn0au8IG1muYj/bAzAA5/7VtqaBjw0FevbigkyxpArqXyDcLt5pvXLsKXu0+3H7ciX2vUAyrRa39boEVT52ZhrerGdv9wBvDvJaI0beMFSAZMZ1i7bPoNY2+/X9aNjwAJE4yQD4XDye69o8vGY43/jTqDE7RXePK9VA5bnFIAyfJyq/QLHtTE6VyMNOsrTQfUYKR5iv5rtlGhEnWbgOZOmzfLclPQhjTkZsCgiUZB81Zh02Rgr0w0hehkfVGJxQjn80V4kEpTK1192EY8MzlikiyDETXIJ8WjA0FO8DAG+ZdErUSVM7I+jvtBAvEhUQmnPRMmswi/ya4yCy86+4l3peuwvUHMTFaTKd0cyr1gkj3ILHIa0EaAOTH4emhwtYmTsWiJa+RJVdL2BvJplVrLawbYJfSFsh+ZWLcxVKsyeTkhdn48AAd0qad+BX44rBH7VN24yYrn/YK0AyDS1afAw7WbgS1EqqPNkBAGju0sm+aHL7xR+eAK/MnKaFQSIu5rIB2klOhv4uiNWDGrZhqshF8/IJ4s0bYYsTBzJaYdAFHqSxRz6LI5QEEHnSQCrZcpIsKAd2/AZ3lEoNgroxtmvSyLdElXSWlqqmDFIERLxDWyXHCOXOShzQgf4xCPovCkVhv/14ASMzwPLCeLM6RwDWiiuBHAeFmsH43GHhVa1nUqT/Xjc5jqoCz3yJgBQeAP3DUz9jYvc2aO0CiEAyKcIgicZpehq+AK+iVoGgqvTF7ez3+VJo8b1xI0LkxyTgSrOvQpW0K6D7gEFPNGCmTL+2vDfD69UP8UWUT+0EGDR/fo/LGG5hXDIDBGwPsDc+YS9bUxDWiCz31Lq9VPoJfZGAE6AlOB9NxCX+0MW8BACF6LzIcHDoYU5XPte2muwb/IoRES7qkesxmC6aRTyD0J7SpPDETz4gkxDa/06fsq6JBKkk9nL9xjAnMRfTZ1l/PFSPyw97s0IiCjhw9qLZ0AMTypdVf70ZbnzbOxH+b/RQLhKPXJIv0YdDd+VgpKEoyCaZ6DdKkeTCTJeukL/v2p+zeatD9I6wB3zpZd7uAxAXB4p0C70QLSOZV8tS8NBkKqlT4wMuY1f3KJFhOfnHbQPtah01DoLU6LVnxh9raXLKqX6QzrGlqhU/Z37WG+2k6Qq6UsqqX/Pl6cpKGT8ZHDOExab387CTCIc7tar9kFjWOS1i5utrKI1dp4PFpWD4F0UyRSVAbdqt+foVuMrgNrjS/+K/yYhXdSr5sQLohS78a0616L1FEkb1R257ifBU630BWvKrdhRNxZykeG5Wb0HaOcQNdvnJ+aGzewRdbU+qPuvW4evru1Iu6Udygxr3hQmzHu5OgSgSYPL9t3z9DCXr+M+nrOCzX0vBepdjMNEOkalFDsWi28yzcNbFGFh3OZ+gZpifvCh5NOS0tX37m/VxYc2evsssjjXSncfOSX8n+LCaD3DS8UAIfaoOOt6QmLfpgg7Yj79GjqLFxoKDOKeB0gbvul2ucu4bsa7lopQZKQ2a2fpx5EJOC8mXmjAh0CDui42kLPSig532rH8gEyZh6/2BJZxpN2x+rfQhmRDsInKHpvqkleyjkpU+2JTilM+NqGMYVa0RqXiA2btczw10/F5OCk9vIr3N8kS0alw1LLdbWewJi82llzOwZGZ76p4VmCNyEtfAk4wz3K4ER0RCG02XHrBA9q/qe5Us6ckxh78UWNyMZBJlGgHjAJ1NJSJiIeUUpQoSwNoC05OTkr/////Sv////9LAHSUYk1wAoWUaBV0lFKUjANwb3OUSxx1jAloYXNfZ2F1c3OUSwCMBWdhdXNzlEcAAAAAAAAAAHVidWIu", "dtype": "float32", "shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": "RandomState(MT19937)"}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVgQAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwFc2hhcGWUKYwFZHR5cGWUjAVudW1weZRoB5OUjAJpOJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRijApfbnBfcmFuZG9tlE51Yi4=", "n": 4, "shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 1507328, "_total_timesteps": 1500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652303687.7713685, "learning_rate": 0.0003, "tensorboard_log": "tmp/", "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVkQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGFDOlxVc2Vyc1xtYWxoc2FsXGRldlxkYmNvbmRhLTIwMjFfMDUtcHkzOC1yMzZcbGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flGgNdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBdoDowMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBiMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGbG9DopwC+6+WzGOg8LZzYXPT86+tHluQAAgD8AAIA/zdCdPFyjJrpG5xk59zbctcqzMDoPxC64AACAPwAAgD8zi7O79nKYP52NSbwvwRu/CrFtvILHjj0AAAAAAAAAAJqRprt7FIc3qtXTOt55EzV7DCA7sj8BugAAgD8AAIA/mvtOPcOFDbpeV1Y4HyAStVi0uTv7g3q3AACAPwAAgD8zmxQ7XONYuo9pHTtEu601MPwAuH7ONboAAIA/AACAP81RZz0KFwO5nVPmvIDQcTQn46Q7iFz+swAAgD8AAIA/mhAmvSkoZ7qwHF86SZ6ENRTxQbpsJoC5AACAPwAAgD8aq1O94TibPcMt4L3sJFG+x0sRvtAoWb0AAAAAAAAAAA36oT32jEy6AsaGO+uujjjF7pk62poeugAAgD8AAIA/MxXavClQObpTRJg7aUYeONO5MDpKs8m3AACAPwAAgD+A1xW9KYBmurNlkjud1Og4+Fs3Osw+LroAAIA/AACAP3CC374r7GU/LJivvnpHEr89Lea+Wie4vAAAAAAAAAAAM0OVPbFl1z1K8le4YBd4vqf+szzj+ne8AAAAAAAAAADAbpi95QGDP0fOi74kpR2/J4givciUPrwAAAAAAAAAAAZCj761R4k+WN7RPgDjhb5uiR69+72bPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.004885333333333408, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVdxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIIlD9g0jqYkCUhpRSlIwBbJRN6AOMAXSUR0CcMJJqqOtGdX2UKGgGaAloD0MIQ/6ZQXxASUCUhpRSlGgVS6xoFkdAnDMnoxHoYHV9lChoBmgJaA9DCCEHJcy0dWJAlIaUUpRoFU3oA2gWR0CcNKT9KmKqdX2UKGgGaAloD0MIF3/bEyTpaUCUhpRSlGgVTegDaBZHQJw3GE4//vR1fZQoaAZoCWgPQwgOv5tu2WdkQJSGlFKUaBVN6ANoFkdAnEDnCKrJbXV9lChoBmgJaA9DCG/W4H3V/GdAlIaUUpRoFU3oA2gWR0CcQanYg7o0dX2UKGgGaAloD0MILjpZaj0qZ0CUhpRSlGgVTegDaBZHQJxC2oIfKZF1fZQoaAZoCWgPQwggtYmT+wNOwJSGlFKUaBVNSwJoFkdAnEMDvNNahnV9lChoBmgJaA9DCEmfVtGfUGZAlIaUUpRoFU3oA2gWR0CcSFRSgoPTdX2UKGgGaAloD0MIaoZUUTy8ZUCUhpRSlGgVTegDaBZHQJxI+UD+zdF1fZQoaAZoCWgPQwitiJro8+tRQJSGlFKUaBVLwWgWR0CcS7rZ8KG+dX2UKGgGaAloD0MIy5wui4kdO0CUhpRSlGgVS7poFkdAnEyY+W4Vh3V9lChoBmgJaA9DCGGm7V9ZamhAlIaUUpRoFU3oA2gWR0CcTl7btZ3cdX2UKGgGaAloD0MI7upVZPSQYkCUhpRSlGgVTegDaBZHQJxOugvlEJB1fZQoaAZoCWgPQwiKPEm65ghkQJSGlFKUaBVN6ANoFkdAnE9Y1+AmRnV9lChoBmgJaA9DCJDZWfTOqmVAlIaUUpRoFU3oA2gWR0CcT2radtl7dX2UKGgGaAloD0MIwoTRrGxxQsCUhpRSlGgVTQgBaBZHQJxQD8aXKKZ1fZQoaAZoCWgPQwie0OtPYodiQJSGlFKUaBVN6ANoFkdAnF0iKWLP2XV9lChoBmgJaA9DCPN0riglz2ZAlIaUUpRoFU3oA2gWR0CcXgNgBtDVdX2UKGgGaAloD0MIpkV9kjt/ZUCUhpRSlGgVTegDaBZHQJxkrU4JeE91fZQoaAZoCWgPQwgbf6KyYfBnQJSGlFKUaBVN6ANoFkdAnGcpSvTw2HV9lChoBmgJaA9DCKd1G9R+z2JAlIaUUpRoFU3oA2gWR0CcaG1stTUBdX2UKGgGaAloD0MIKEnXTL7MaECUhpRSlGgVTegDaBZHQJxqstqYZ2p1fZQoaAZoCWgPQwgbEYyDy7dmQJSGlFKUaBVN6ANoFkdAnHUWTot+TnV9lChoBmgJaA9DCG/Tn/3ITGBAlIaUUpRoFU3oA2gWR0Ccffa7VawEdX2UKGgGaAloD0MI8NsQ4zWkZkCUhpRSlGgVTegDaBZHQJx+xOIqLCN1fZQoaAZoCWgPQwguHAjJgkFlQJSGlFKUaBVN6ANoFkdAnKlPJA+pwXV9lChoBmgJaA9DCONsOgK4CGVAlIaUUpRoFU3oA2gWR0CcqlaAFxGUdX2UKGgGaAloD0MIAn6NJMFgY0CUhpRSlGgVTegDaBZHQJysWk2xY7t1fZQoaAZoCWgPQwgtJ6H0BcJlQJSGlFKUaBVN6ANoFkdAnKzet0V8C3V9lChoBmgJaA9DCFX2XRH8EGVAlIaUUpRoFU3oA2gWR0CcrX3Q2MsIdX2UKGgGaAloD0MIvMtFfCdGYECUhpRSlGgVTegDaBZHQJytn9R77bd1fZQoaAZoCWgPQwg2j8Ngfq5qQJSGlFKUaBVN6ANoFkdAnK40vXbudHV9lChoBmgJaA9DCJC93v3xbmVAlIaUUpRoFU3oA2gWR0CcvQzH0btJdX2UKGgGaAloD0MIeAyP/SzXZ0CUhpRSlGgVTegDaBZHQJy+ByvLX+V1fZQoaAZoCWgPQwh2weCaO9hlQJSGlFKUaBVN6ANoFkdAnMTl8XvYvnV9lChoBmgJaA9DCCS05VwKBmVAlIaUUpRoFU3oA2gWR0Ccx3/PPcBVdX2UKGgGaAloD0MIPBOaJJaJZkCUhpRSlGgVTegDaBZHQJzI1Bv73wl1fZQoaAZoCWgPQwjuW60TF85gQJSGlFKUaBVN6ANoFkdAnMseIAOrhnV9lChoBmgJaA9DCC8yAb/G8mNAlIaUUpRoFU3oA2gWR0Cc1ejfNzKcdX2UKGgGaAloD0MIzZVBtUESZkCUhpRSlGgVTegDaBZHQJzfLBAOav11fZQoaAZoCWgPQwhsdw/QfWNjQJSGlFKUaBVN6ANoFkdAnOAO1KGtZHV9lChoBmgJaA9DCDGyZI5ltWRAlIaUUpRoFU3oA2gWR0Cc43U83dbgdX2UKGgGaAloD0MIwAZEiCujY0CUhpRSlGgVTegDaBZHQJzkY2CNCJJ1fZQoaAZoCWgPQwgK16NwvTtlQJSGlFKUaBVN6ANoFkdAnOZWx2SuAHV9lChoBmgJaA9DCAdCsoAJcGRAlIaUUpRoFU3oA2gWR0Cc5saVlf7adX2UKGgGaAloD0MIuYybGmgyZ0CUhpRSlGgVTegDaBZHQJznZV4oqkN1fZQoaAZoCWgPQwi6u86G/FFkQJSGlFKUaBVN6ANoFkdAnOd3YcvM83V9lChoBmgJaA9DCOksswhF0WRAlIaUUpRoFU3oA2gWR0Cc6BxPfsNUdX2UKGgGaAloD0MIeCXJc30vUECUhpRSlGgVS7NoFkdAnO+uLrHEM3V9lChoBmgJaA9DCIygMZOo9GVAlIaUUpRoFU3oA2gWR0Cc9zIk7fYSdX2UKGgGaAloD0MIxTh/EwqgYUCUhpRSlGgVTegDaBZHQJz4PJ6po9N1fZQoaAZoCWgPQwgw9IjR8wdjQJSGlFKUaBVN6ANoFkdAnQAb6xgRb3V9lChoBmgJaA9DCO/FF+3xT2VAlIaUUpRoFU3oA2gWR0CdAu8SPEKmdX2UKGgGaAloD0MIggAZOnbgXkCUhpRSlGgVTegDaBZHQJ0Ela3Zwn91fZQoaAZoCWgPQwh5k9+ik/1jQJSGlFKUaBVN6ANoFkdAnQdbgsK9f3V9lChoBmgJaA9DCAbxgR3/4GRAlIaUUpRoFU3oA2gWR0CdExj7hvR7dX2UKGgGaAloD0MIbW+3JIf1Z0CUhpRSlGgVTegDaBZHQJ0c7FHavid1fZQoaAZoCWgPQwj7H2Ct2uRkQJSGlFKUaBVN6ANoFkdAnR2/FaSs83V9lChoBmgJaA9DCFThz/DmwmVAlIaUUpRoFU3oA2gWR0CdISW2PT5PdX2UKGgGaAloD0MIuTmVDABaZECUhpRSlGgVTegDaBZHQJ0iLRCx/ut1fZQoaAZoCWgPQwiXjc75qdxlQJSGlFKUaBVN6ANoFkdAnUzwtJ4B3nV9lChoBmgJaA9DCOZatABt4GZAlIaUUpRoFU3oA2gWR0CdTXUiY9gXdX2UKGgGaAloD0MITFXa4hoQZUCUhpRSlGgVTegDaBZHQJ1OE//vOQh1fZQoaAZoCWgPQwgF3V7SGP9iQJSGlFKUaBVN6ANoFkdAnU7fnfVI7XV9lChoBmgJaA9DCFzjM9k/pFBAlIaUUpRoFUvCaBZHQJ1TYifQKKJ1fZQoaAZoCWgPQwhAvRk1X105QJSGlFKUaBVLrWgWR0CdVsH1OCXhdX2UKGgGaAloD0MI7x01JkRJZ0CUhpRSlGgVTegDaBZHQJ1XKw5eZ5R1fZQoaAZoCWgPQwjz5JoCmYBnQJSGlFKUaBVN6ANoFkdAnV0nUUfxMHV9lChoBmgJaA9DCH1AoDNpmGhAlIaUUpRoFU3oA2gWR0CdXgiI+GGmdX2UKGgGaAloD0MIwYwpWOMfZUCUhpRSlGgVTegDaBZHQJ1j5LUTcqR1fZQoaAZoCWgPQwheLXdmgsBjQJSGlFKUaBVN6ANoFkdAnWZQ9eQdS3V9lChoBmgJaA9DCGWKOQg61mRAlIaUUpRoFU3oA2gWR0CdZ7msvIwNdX2UKGgGaAloD0MI6lp7n6opZ0CUhpRSlGgVTegDaBZHQJ1p2nrIHTt1fZQoaAZoCWgPQwg6IXTQJdlTQJSGlFKUaBVLrGgWR0Cdb2p2ECeVdX2UKGgGaAloD0MI3sZmRyqDZkCUhpRSlGgVTegDaBZHQJ10FMWXTmZ1fZQoaAZoCWgPQwiNRj6v+PBmQJSGlFKUaBVN6ANoFkdAnX1DgAIY33V9lChoBmgJaA9DCAfRWtHmp2VAlIaUUpRoFU3oA2gWR0Cdfg0G/vfCdX2UKGgGaAloD0MIRUlIpO09ZkCUhpRSlGgVTegDaBZHQJ2CBNFjNIN1fZQoaAZoCWgPQwjg9ZmzPoFlQJSGlFKUaBVN6ANoFkdAnYQIMfA9FHV9lChoBmgJaA9DCDWYhuGj1GNAlIaUUpRoFU3oA2gWR0CdhIyfL9uQdX2UKGgGaAloD0MI6zao/VYxaECUhpRSlGgVTegDaBZHQJ2F9vVEuxt1fZQoaAZoCWgPQwh/ox03/D1hQJSGlFKUaBVN6ANoFkdAnYsjLSuyNXV9lChoBmgJaA9DCKkT0ETYHWVAlIaUUpRoFU3oA2gWR0CdjhwcHWz4dX2UKGgGaAloD0MILPNWXYfwZkCUhpRSlGgVTegDaBZHQJ2OkJMQEp11fZQoaAZoCWgPQwjFcHUARFVkQJSGlFKUaBVN6ANoFkdAnZTPYvnKXHV9lChoBmgJaA9DCJKwbycRYWVAlIaUUpRoFU3oA2gWR0CdlYwpe/pMdX2UKGgGaAloD0MIBmUaTS6gZECUhpRSlGgVTegDaBZHQJ2boRSP2f11fZQoaAZoCWgPQwgHlbiOcZljQJSGlFKUaBVN6ANoFkdAnZ/JWV/tpnV9lChoBmgJaA9DCH9rJ0rCrWVAlIaUUpRoFU3oA2gWR0CdolE+gUUPdX2UKGgGaAloD0MIxqLp7GTvZkCUhpRSlGgVTegDaBZHQJ2oljurp7l1fZQoaAZoCWgPQwi+FB40u/hSQJSGlFKUaBVLtWgWR0Cdqr0gKWszdX2UKGgGaAloD0MIih9j7toqYUCUhpRSlGgVTegDaBZHQJ2tbnoxHoZ1fZQoaAZoCWgPQwhSZRh3g8JRQJSGlFKUaBVLq2gWR0Cds2WGRFI/dX2UKGgGaAloD0MIBwq8k08gXECUhpRSlGgVTegDaBZHQJ22/yH2ys11fZQoaAZoCWgPQwiNmq+SD3NiQJSGlFKUaBVN6ANoFkdAnbfmjGkvb3V9lChoBmgJaA9DCGiyf54GhEpAlIaUUpRoFUulaBZHQJ24sBhhH9Z1fZQoaAZoCWgPQwhOKhprf/tfQJSGlFKUaBVN6ANoFkdAnbxpElVtGnV9lChoBmgJaA9DCLt868P6n2NAlIaUUpRoFU3oA2gWR0CdvoER8MNMdX2UKGgGaAloD0MIineAJ63vZECUhpRSlGgVTegDaBZHQJ2/BX2dupF1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 736, "n_steps": 2048, "gamma": 0.998, "gae_lambda": 0.995, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 256, "n_epochs": 16, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVkQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGFDOlxVc2Vyc1xtYWxoc2FsXGRldlxkYmNvbmRhLTIwMjFfMDUtcHkzOC1yMzZcbGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flGgNdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBdoDowMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBiMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "target_kl": null, "system_info": {"OS": "Windows-10-10.0.18362-SP0 10.0.18362", "Python": "3.8.8", "Stable-Baselines3": "1.4.0", "PyTorch": "1.11.0", "GPU Enabled": "False", "Numpy": "1.20.1", "Gym": "0.19.0"}}
|
ppo-LunarLander-v2.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6ee88eb1b3c9c708eff0760a1addb754447b987614f2643e5d9301b4f2333db
|
3 |
+
size 147174
|
ppo-LunarLander-v2/data
CHANGED
@@ -4,25 +4,25 @@
|
|
4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
-
"__init__": "<function ActorCriticPolicy.__init__ at
|
8 |
-
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at
|
9 |
-
"reset_noise": "<function ActorCriticPolicy.reset_noise at
|
10 |
-
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at
|
11 |
-
"_build": "<function ActorCriticPolicy._build at
|
12 |
-
"forward": "<function ActorCriticPolicy.forward at
|
13 |
-
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at
|
14 |
-
"_predict": "<function ActorCriticPolicy._predict at
|
15 |
-
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at
|
16 |
-
"get_distribution": "<function ActorCriticPolicy.get_distribution at
|
17 |
-
"predict_values": "<function ActorCriticPolicy.predict_values at
|
18 |
"__abstractmethods__": "frozenset()",
|
19 |
-
"_abc_impl": "<_abc_data object at
|
20 |
},
|
21 |
"verbose": 1,
|
22 |
"policy_kwargs": {},
|
23 |
"observation_space": {
|
24 |
":type:": "<class 'gym.spaces.box.Box'>",
|
25 |
-
":serialized:": "
|
26 |
"dtype": "float32",
|
27 |
"shape": [
|
28 |
8
|
@@ -31,7 +31,7 @@
|
|
31 |
"high": "[inf inf inf inf inf inf inf inf]",
|
32 |
"bounded_below": "[False False False False False False False False]",
|
33 |
"bounded_above": "[False False False False False False False False]",
|
34 |
-
"_np_random":
|
35 |
},
|
36 |
"action_space": {
|
37 |
":type:": "<class 'gym.spaces.discrete.Discrete'>",
|
@@ -42,12 +42,12 @@
|
|
42 |
"_np_random": null
|
43 |
},
|
44 |
"n_envs": 16,
|
45 |
-
"num_timesteps":
|
46 |
-
"_total_timesteps":
|
47 |
"_num_timesteps_at_start": 0,
|
48 |
"seed": null,
|
49 |
"action_noise": null,
|
50 |
-
"start_time":
|
51 |
"learning_rate": 0.0003,
|
52 |
"tensorboard_log": "tmp/",
|
53 |
"lr_schedule": {
|
@@ -56,7 +56,7 @@
|
|
56 |
},
|
57 |
"_last_obs": {
|
58 |
":type:": "<class 'numpy.ndarray'>",
|
59 |
-
":serialized:": "
|
60 |
},
|
61 |
"_last_episode_starts": {
|
62 |
":type:": "<class 'numpy.ndarray'>",
|
@@ -66,24 +66,24 @@
|
|
66 |
"_episode_num": 0,
|
67 |
"use_sde": false,
|
68 |
"sde_sample_freq": -1,
|
69 |
-
"_current_progress_remaining": -0.
|
70 |
"ep_info_buffer": {
|
71 |
":type:": "<class 'collections.deque'>",
|
72 |
-
":serialized:": "
|
73 |
},
|
74 |
"ep_success_buffer": {
|
75 |
":type:": "<class 'collections.deque'>",
|
76 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
77 |
},
|
78 |
-
"_n_updates":
|
79 |
"n_steps": 2048,
|
80 |
"gamma": 0.998,
|
81 |
-
"gae_lambda": 0.
|
82 |
"ent_coef": 0.01,
|
83 |
"vf_coef": 0.5,
|
84 |
"max_grad_norm": 0.5,
|
85 |
-
"batch_size":
|
86 |
-
"n_epochs":
|
87 |
"clip_range": {
|
88 |
":type:": "<class 'function'>",
|
89 |
":serialized:": "gAWVkQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGFDOlxVc2Vyc1xtYWxoc2FsXGRldlxkYmNvbmRhLTIwMjFfMDUtcHkzOC1yMzZcbGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flGgNdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBdoDowMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBiMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
|
|
|
4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
+
"__init__": "<function ActorCriticPolicy.__init__ at 0x0000021F61AE31F0>",
|
8 |
+
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x0000021F61AE3280>",
|
9 |
+
"reset_noise": "<function ActorCriticPolicy.reset_noise at 0x0000021F61AE3310>",
|
10 |
+
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x0000021F61AE33A0>",
|
11 |
+
"_build": "<function ActorCriticPolicy._build at 0x0000021F61AE3430>",
|
12 |
+
"forward": "<function ActorCriticPolicy.forward at 0x0000021F61AE34C0>",
|
13 |
+
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x0000021F61AE3550>",
|
14 |
+
"_predict": "<function ActorCriticPolicy._predict at 0x0000021F61AE35E0>",
|
15 |
+
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x0000021F61AE3670>",
|
16 |
+
"get_distribution": "<function ActorCriticPolicy.get_distribution at 0x0000021F61AE3700>",
|
17 |
+
"predict_values": "<function ActorCriticPolicy.predict_values at 0x0000021F61AE3790>",
|
18 |
"__abstractmethods__": "frozenset()",
|
19 |
+
"_abc_impl": "<_abc_data object at 0x0000021F61AD8D20>"
|
20 |
},
|
21 |
"verbose": 1,
|
22 |
"policy_kwargs": {},
|
23 |
"observation_space": {
|
24 |
":type:": "<class 'gym.spaces.box.Box'>",
|
25 |
+
":serialized:": "gAWVJQwAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBXNoYXBllEsIhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAAAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSwiFlIwBQ5R0lFKUjARoaWdolGgSKJYgAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/lGgKSwiFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWCAAAAAAAAAAAAAAAAAAAAJRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZRoFXSUUpSMDWJvdW5kZWRfYWJvdmWUaBIolggAAAAAAAAAAAAAAAAAAACUaCFLCIWUaBV0lFKUjApfbnBfcmFuZG9tlIwUbnVtcHkucmFuZG9tLl9waWNrbGWUjBJfX3JhbmRvbXN0YXRlX2N0b3KUk5SMB01UMTk5MzeUhZRSlH2UKIwNYml0X2dlbmVyYXRvcpRoMIwFc3RhdGWUfZQojANrZXmUaBIolsAJAAAAAAAAgIYUuA51sC9/GaBAogWdT4aqPn/BNJuTKl5lpSyWTe5iRbx8HC1lKMMgblSSrAaw2HUGsWL9dmmoeM1BusXYG7L0gga0EfncHTzE7o1dUgaUmtTfIu7urWTopXFtXLBY9SvG/n/RpeNcI70bjcq1vSVxue5Y97vURA12iLkLbbOrytk+SV42OVyxK8Pra+XeXX6APZXhdnpndSAh4I2JY/bQm33sXarpzVnDSvZX/1bO2S1t0p4mnFjmNAGC+TSTF0905Tg3RGVC4X6b6pD+UOLvKsAdeZ/5N8089fxJCLB/y7nPUk69iNihFvS99x9ki+wfYa38Rld/eF/xkNKfEzWoefsnDtWYDa0WrM2lwDux10HFpl9Wh0lGoDFu1tnGPZRnLYTX6MZ3KMGqZuaDcvYcZCfyKJ3VdNBMAJyTlKJ5giNx+9jRCil5opqfYSPSGInrOmCTtSasF8jQ6WHel8aguaLOlUomQ18hWPI4g8BYkn62+SU+usK+Wi27JlaUfdUQOe/TjZTkGkf0NZYXEoPcPcG94iy72DeKsq+lec6S5KXsvWSI3JflabUmyvh1o9WgHBoYYzPjmHCJ/zncyHbKc1+qG1Ad7XzEZLcUeasdqtsThYpX4Pu29CmzmKoQuaAxhFo4ZLXbt3SCMzxPkFR4WDFaUE/ZervcfjHx53KWrnjCA4F6ncA8FUXJYIErKYajOoMrqbedPs7ZbDepmRvPCUP/t7We0iFj1vw2FGKsjdf0OeNwbHdibbiop1B2iJytURXxxYmz1F1RIyEiwUX20PC908fEVdxJW8oO9gyXgcV+UWfu0CuNpDw7sEoFt81oo6pQe2yNFyun8JA4xK1Bq14sK/d92MAiMLdOEz8CwCf3L2ZIy02r6Az9hRBJuFVaz727HjSBhdMgn6p7Xr2lNOQBBoo+3BdlrJIW0ZstmBCMhDRns0QvUHMzrMrhPYE4dQsPMF+sxbF2Dx+MZdauzWlbcdVrdTN9d2UN0c2BBDUx6lFJ3sRZfEHLJ7OkppCs/bAyjrfHI/7sG4YvO4ZOPxrL3Y/S2KW3sIKRdvldi43SPunKhL4nktEAmKDvxP9WdP/v66LPSrUzjN5tswmHjKuUZw/avRXO3RIFBBHtEGbRqRU6RQD15DLZft0HwyfVZwN9CZ1cXarOOCQrPPn28h7KTHujKCTYg0MnWBlC9S/6XNVxNZhbIbnR4aH6a+WCrlwFn2qeDzA1pcyrxM/teWS2s1l3Y9xiXpyzjaVUJEiGtXV9BEmEstjzF+d/0EAAG2LEUW/mbxx/R43ms9HJcBeYz3ixvSNzXVerz3RT557h9g9lox5PuVWAP4aZbYE4y3+LkGQFjwea2FE68RXWjslWeyrRUlirXhMNV8/jGB9UtJgFLva7Y99573/FZ1M9R4JWxQvveKN2sp4+vON6/tKv+C2n+oYH8jJquQeFA3sWMKMS4fCbXoH+4lhkd6ktywESpdChW8eC7ScUe9v2VUwauFQtBKgCznvUBw9tfMJGTj7xfneeILl6XuUxjeyE/8PHrHcU1tVws72T9azGKjd+TgYoKiL5/+hbuQqtEWJ775Xi7oB0Fk7zwP4B3Mq08+n84Xmn0au8IG1muYj/bAzAA5/7VtqaBjw0FevbigkyxpArqXyDcLt5pvXLsKXu0+3H7ciX2vUAyrRa39boEVT52ZhrerGdv9wBvDvJaI0beMFSAZMZ1i7bPoNY2+/X9aNjwAJE4yQD4XDye69o8vGY43/jTqDE7RXePK9VA5bnFIAyfJyq/QLHtTE6VyMNOsrTQfUYKR5iv5rtlGhEnWbgOZOmzfLclPQhjTkZsCgiUZB81Zh02Rgr0w0hehkfVGJxQjn80V4kEpTK1192EY8MzlikiyDETXIJ8WjA0FO8DAG+ZdErUSVM7I+jvtBAvEhUQmnPRMmswi/ya4yCy86+4l3peuwvUHMTFaTKd0cyr1gkj3ILHIa0EaAOTH4emhwtYmTsWiJa+RJVdL2BvJplVrLawbYJfSFsh+ZWLcxVKsyeTkhdn48AAd0qad+BX44rBH7VN24yYrn/YK0AyDS1afAw7WbgS1EqqPNkBAGju0sm+aHL7xR+eAK/MnKaFQSIu5rIB2klOhv4uiNWDGrZhqshF8/IJ4s0bYYsTBzJaYdAFHqSxRz6LI5QEEHnSQCrZcpIsKAd2/AZ3lEoNgroxtmvSyLdElXSWlqqmDFIERLxDWyXHCOXOShzQgf4xCPovCkVhv/14ASMzwPLCeLM6RwDWiiuBHAeFmsH43GHhVa1nUqT/Xjc5jqoCz3yJgBQeAP3DUz9jYvc2aO0CiEAyKcIgicZpehq+AK+iVoGgqvTF7ez3+VJo8b1xI0LkxyTgSrOvQpW0K6D7gEFPNGCmTL+2vDfD69UP8UWUT+0EGDR/fo/LGG5hXDIDBGwPsDc+YS9bUxDWiCz31Lq9VPoJfZGAE6AlOB9NxCX+0MW8BACF6LzIcHDoYU5XPte2muwb/IoRES7qkesxmC6aRTyD0J7SpPDETz4gkxDa/06fsq6JBKkk9nL9xjAnMRfTZ1l/PFSPyw97s0IiCjhw9qLZ0AMTypdVf70ZbnzbOxH+b/RQLhKPXJIv0YdDd+VgpKEoyCaZ6DdKkeTCTJeukL/v2p+zeatD9I6wB3zpZd7uAxAXB4p0C70QLSOZV8tS8NBkKqlT4wMuY1f3KJFhOfnHbQPtah01DoLU6LVnxh9raXLKqX6QzrGlqhU/Z37WG+2k6Qq6UsqqX/Pl6cpKGT8ZHDOExab387CTCIc7tar9kFjWOS1i5utrKI1dp4PFpWD4F0UyRSVAbdqt+foVuMrgNrjS/+K/yYhXdSr5sQLohS78a0616L1FEkb1R257ifBU630BWvKrdhRNxZykeG5Wb0HaOcQNdvnJ+aGzewRdbU+qPuvW4evru1Iu6Udygxr3hQmzHu5OgSgSYPL9t3z9DCXr+M+nrOCzX0vBepdjMNEOkalFDsWi28yzcNbFGFh3OZ+gZpifvCh5NOS0tX37m/VxYc2evsssjjXSncfOSX8n+LCaD3DS8UAIfaoOOt6QmLfpgg7Yj79GjqLFxoKDOKeB0gbvul2ucu4bsa7lopQZKQ2a2fpx5EJOC8mXmjAh0CDui42kLPSig532rH8gEyZh6/2BJZxpN2x+rfQhmRDsInKHpvqkleyjkpU+2JTilM+NqGMYVa0RqXiA2btczw10/F5OCk9vIr3N8kS0alw1LLdbWewJi82llzOwZGZ76p4VmCNyEtfAk4wz3K4ER0RCG02XHrBA9q/qe5Us6ckxh78UWNyMZBJlGgHjAJ1NJSJiIeUUpQoSwNoC05OTkr/////Sv////9LAHSUYk1wAoWUaBV0lFKUjANwb3OUSxx1jAloYXNfZ2F1c3OUSwCMBWdhdXNzlEcAAAAAAAAAAHVidWIu",
|
26 |
"dtype": "float32",
|
27 |
"shape": [
|
28 |
8
|
|
|
31 |
"high": "[inf inf inf inf inf inf inf inf]",
|
32 |
"bounded_below": "[False False False False False False False False]",
|
33 |
"bounded_above": "[False False False False False False False False]",
|
34 |
+
"_np_random": "RandomState(MT19937)"
|
35 |
},
|
36 |
"action_space": {
|
37 |
":type:": "<class 'gym.spaces.discrete.Discrete'>",
|
|
|
42 |
"_np_random": null
|
43 |
},
|
44 |
"n_envs": 16,
|
45 |
+
"num_timesteps": 1507328,
|
46 |
+
"_total_timesteps": 1500000,
|
47 |
"_num_timesteps_at_start": 0,
|
48 |
"seed": null,
|
49 |
"action_noise": null,
|
50 |
+
"start_time": 1652303687.7713685,
|
51 |
"learning_rate": 0.0003,
|
52 |
"tensorboard_log": "tmp/",
|
53 |
"lr_schedule": {
|
|
|
56 |
},
|
57 |
"_last_obs": {
|
58 |
":type:": "<class 'numpy.ndarray'>",
|
59 |
+
":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGbG9DopwC+6+WzGOg8LZzYXPT86+tHluQAAgD8AAIA/zdCdPFyjJrpG5xk59zbctcqzMDoPxC64AACAPwAAgD8zi7O79nKYP52NSbwvwRu/CrFtvILHjj0AAAAAAAAAAJqRprt7FIc3qtXTOt55EzV7DCA7sj8BugAAgD8AAIA/mvtOPcOFDbpeV1Y4HyAStVi0uTv7g3q3AACAPwAAgD8zmxQ7XONYuo9pHTtEu601MPwAuH7ONboAAIA/AACAP81RZz0KFwO5nVPmvIDQcTQn46Q7iFz+swAAgD8AAIA/mhAmvSkoZ7qwHF86SZ6ENRTxQbpsJoC5AACAPwAAgD8aq1O94TibPcMt4L3sJFG+x0sRvtAoWb0AAAAAAAAAAA36oT32jEy6AsaGO+uujjjF7pk62poeugAAgD8AAIA/MxXavClQObpTRJg7aUYeONO5MDpKs8m3AACAPwAAgD+A1xW9KYBmurNlkjud1Og4+Fs3Osw+LroAAIA/AACAP3CC374r7GU/LJivvnpHEr89Lea+Wie4vAAAAAAAAAAAM0OVPbFl1z1K8le4YBd4vqf+szzj+ne8AAAAAAAAAADAbpi95QGDP0fOi74kpR2/J4givciUPrwAAAAAAAAAAAZCj761R4k+WN7RPgDjhb5uiR69+72bPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
|
60 |
},
|
61 |
"_last_episode_starts": {
|
62 |
":type:": "<class 'numpy.ndarray'>",
|
|
|
66 |
"_episode_num": 0,
|
67 |
"use_sde": false,
|
68 |
"sde_sample_freq": -1,
|
69 |
+
"_current_progress_remaining": -0.004885333333333408,
|
70 |
"ep_info_buffer": {
|
71 |
":type:": "<class 'collections.deque'>",
|
72 |
+
":serialized:": "gAWVdxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIIlD9g0jqYkCUhpRSlIwBbJRN6AOMAXSUR0CcMJJqqOtGdX2UKGgGaAloD0MIQ/6ZQXxASUCUhpRSlGgVS6xoFkdAnDMnoxHoYHV9lChoBmgJaA9DCCEHJcy0dWJAlIaUUpRoFU3oA2gWR0CcNKT9KmKqdX2UKGgGaAloD0MIF3/bEyTpaUCUhpRSlGgVTegDaBZHQJw3GE4//vR1fZQoaAZoCWgPQwgOv5tu2WdkQJSGlFKUaBVN6ANoFkdAnEDnCKrJbXV9lChoBmgJaA9DCG/W4H3V/GdAlIaUUpRoFU3oA2gWR0CcQanYg7o0dX2UKGgGaAloD0MILjpZaj0qZ0CUhpRSlGgVTegDaBZHQJxC2oIfKZF1fZQoaAZoCWgPQwggtYmT+wNOwJSGlFKUaBVNSwJoFkdAnEMDvNNahnV9lChoBmgJaA9DCEmfVtGfUGZAlIaUUpRoFU3oA2gWR0CcSFRSgoPTdX2UKGgGaAloD0MIaoZUUTy8ZUCUhpRSlGgVTegDaBZHQJxI+UD+zdF1fZQoaAZoCWgPQwitiJro8+tRQJSGlFKUaBVLwWgWR0CcS7rZ8KG+dX2UKGgGaAloD0MIy5wui4kdO0CUhpRSlGgVS7poFkdAnEyY+W4Vh3V9lChoBmgJaA9DCGGm7V9ZamhAlIaUUpRoFU3oA2gWR0CcTl7btZ3cdX2UKGgGaAloD0MI7upVZPSQYkCUhpRSlGgVTegDaBZHQJxOugvlEJB1fZQoaAZoCWgPQwiKPEm65ghkQJSGlFKUaBVN6ANoFkdAnE9Y1+AmRnV9lChoBmgJaA9DCJDZWfTOqmVAlIaUUpRoFU3oA2gWR0CcT2radtl7dX2UKGgGaAloD0MIwoTRrGxxQsCUhpRSlGgVTQgBaBZHQJxQD8aXKKZ1fZQoaAZoCWgPQwie0OtPYodiQJSGlFKUaBVN6ANoFkdAnF0iKWLP2XV9lChoBmgJaA9DCPN0riglz2ZAlIaUUpRoFU3oA2gWR0CcXgNgBtDVdX2UKGgGaAloD0MIpkV9kjt/ZUCUhpRSlGgVTegDaBZHQJxkrU4JeE91fZQoaAZoCWgPQwgbf6KyYfBnQJSGlFKUaBVN6ANoFkdAnGcpSvTw2HV9lChoBmgJaA9DCKd1G9R+z2JAlIaUUpRoFU3oA2gWR0CcaG1stTUBdX2UKGgGaAloD0MIKEnXTL7MaECUhpRSlGgVTegDaBZHQJxqstqYZ2p1fZQoaAZoCWgPQwgbEYyDy7dmQJSGlFKUaBVN6ANoFkdAnHUWTot+TnV9lChoBmgJaA9DCG/Tn/3ITGBAlIaUUpRoFU3oA2gWR0Ccffa7VawEdX2UKGgGaAloD0MI8NsQ4zWkZkCUhpRSlGgVTegDaBZHQJx+xOIqLCN1fZQoaAZoCWgPQwguHAjJgkFlQJSGlFKUaBVN6ANoFkdAnKlPJA+pwXV9lChoBmgJaA9DCONsOgK4CGVAlIaUUpRoFU3oA2gWR0CcqlaAFxGUdX2UKGgGaAloD0MIAn6NJMFgY0CUhpRSlGgVTegDaBZHQJysWk2xY7t1fZQoaAZoCWgPQwgtJ6H0BcJlQJSGlFKUaBVN6ANoFkdAnKzet0V8C3V9lChoBmgJaA9DCFX2XRH8EGVAlIaUUpRoFU3oA2gWR0CcrX3Q2MsIdX2UKGgGaAloD0MIvMtFfCdGYECUhpRSlGgVTegDaBZHQJytn9R77bd1fZQoaAZoCWgPQwg2j8Ngfq5qQJSGlFKUaBVN6ANoFkdAnK40vXbudHV9lChoBmgJaA9DCJC93v3xbmVAlIaUUpRoFU3oA2gWR0CcvQzH0btJdX2UKGgGaAloD0MIeAyP/SzXZ0CUhpRSlGgVTegDaBZHQJy+ByvLX+V1fZQoaAZoCWgPQwh2weCaO9hlQJSGlFKUaBVN6ANoFkdAnMTl8XvYvnV9lChoBmgJaA9DCCS05VwKBmVAlIaUUpRoFU3oA2gWR0Ccx3/PPcBVdX2UKGgGaAloD0MIPBOaJJaJZkCUhpRSlGgVTegDaBZHQJzI1Bv73wl1fZQoaAZoCWgPQwjuW60TF85gQJSGlFKUaBVN6ANoFkdAnMseIAOrhnV9lChoBmgJaA9DCC8yAb/G8mNAlIaUUpRoFU3oA2gWR0Cc1ejfNzKcdX2UKGgGaAloD0MIzZVBtUESZkCUhpRSlGgVTegDaBZHQJzfLBAOav11fZQoaAZoCWgPQwhsdw/QfWNjQJSGlFKUaBVN6ANoFkdAnOAO1KGtZHV9lChoBmgJaA9DCDGyZI5ltWRAlIaUUpRoFU3oA2gWR0Cc43U83dbgdX2UKGgGaAloD0MIwAZEiCujY0CUhpRSlGgVTegDaBZHQJzkY2CNCJJ1fZQoaAZoCWgPQwgK16NwvTtlQJSGlFKUaBVN6ANoFkdAnOZWx2SuAHV9lChoBmgJaA9DCAdCsoAJcGRAlIaUUpRoFU3oA2gWR0Cc5saVlf7adX2UKGgGaAloD0MIuYybGmgyZ0CUhpRSlGgVTegDaBZHQJznZV4oqkN1fZQoaAZoCWgPQwi6u86G/FFkQJSGlFKUaBVN6ANoFkdAnOd3YcvM83V9lChoBmgJaA9DCOksswhF0WRAlIaUUpRoFU3oA2gWR0Cc6BxPfsNUdX2UKGgGaAloD0MIeCXJc30vUECUhpRSlGgVS7NoFkdAnO+uLrHEM3V9lChoBmgJaA9DCIygMZOo9GVAlIaUUpRoFU3oA2gWR0Cc9zIk7fYSdX2UKGgGaAloD0MIxTh/EwqgYUCUhpRSlGgVTegDaBZHQJz4PJ6po9N1fZQoaAZoCWgPQwgw9IjR8wdjQJSGlFKUaBVN6ANoFkdAnQAb6xgRb3V9lChoBmgJaA9DCO/FF+3xT2VAlIaUUpRoFU3oA2gWR0CdAu8SPEKmdX2UKGgGaAloD0MIggAZOnbgXkCUhpRSlGgVTegDaBZHQJ0Ela3Zwn91fZQoaAZoCWgPQwh5k9+ik/1jQJSGlFKUaBVN6ANoFkdAnQdbgsK9f3V9lChoBmgJaA9DCAbxgR3/4GRAlIaUUpRoFU3oA2gWR0CdExj7hvR7dX2UKGgGaAloD0MIbW+3JIf1Z0CUhpRSlGgVTegDaBZHQJ0c7FHavid1fZQoaAZoCWgPQwj7H2Ct2uRkQJSGlFKUaBVN6ANoFkdAnR2/FaSs83V9lChoBmgJaA9DCFThz/DmwmVAlIaUUpRoFU3oA2gWR0CdISW2PT5PdX2UKGgGaAloD0MIuTmVDABaZECUhpRSlGgVTegDaBZHQJ0iLRCx/ut1fZQoaAZoCWgPQwiXjc75qdxlQJSGlFKUaBVN6ANoFkdAnUzwtJ4B3nV9lChoBmgJaA9DCOZatABt4GZAlIaUUpRoFU3oA2gWR0CdTXUiY9gXdX2UKGgGaAloD0MITFXa4hoQZUCUhpRSlGgVTegDaBZHQJ1OE//vOQh1fZQoaAZoCWgPQwgF3V7SGP9iQJSGlFKUaBVN6ANoFkdAnU7fnfVI7XV9lChoBmgJaA9DCFzjM9k/pFBAlIaUUpRoFUvCaBZHQJ1TYifQKKJ1fZQoaAZoCWgPQwhAvRk1X105QJSGlFKUaBVLrWgWR0CdVsH1OCXhdX2UKGgGaAloD0MI7x01JkRJZ0CUhpRSlGgVTegDaBZHQJ1XKw5eZ5R1fZQoaAZoCWgPQwjz5JoCmYBnQJSGlFKUaBVN6ANoFkdAnV0nUUfxMHV9lChoBmgJaA9DCH1AoDNpmGhAlIaUUpRoFU3oA2gWR0CdXgiI+GGmdX2UKGgGaAloD0MIwYwpWOMfZUCUhpRSlGgVTegDaBZHQJ1j5LUTcqR1fZQoaAZoCWgPQwheLXdmgsBjQJSGlFKUaBVN6ANoFkdAnWZQ9eQdS3V9lChoBmgJaA9DCGWKOQg61mRAlIaUUpRoFU3oA2gWR0CdZ7msvIwNdX2UKGgGaAloD0MI6lp7n6opZ0CUhpRSlGgVTegDaBZHQJ1p2nrIHTt1fZQoaAZoCWgPQwg6IXTQJdlTQJSGlFKUaBVLrGgWR0Cdb2p2ECeVdX2UKGgGaAloD0MI3sZmRyqDZkCUhpRSlGgVTegDaBZHQJ10FMWXTmZ1fZQoaAZoCWgPQwiNRj6v+PBmQJSGlFKUaBVN6ANoFkdAnX1DgAIY33V9lChoBmgJaA9DCAfRWtHmp2VAlIaUUpRoFU3oA2gWR0Cdfg0G/vfCdX2UKGgGaAloD0MIRUlIpO09ZkCUhpRSlGgVTegDaBZHQJ2CBNFjNIN1fZQoaAZoCWgPQwjg9ZmzPoFlQJSGlFKUaBVN6ANoFkdAnYQIMfA9FHV9lChoBmgJaA9DCDWYhuGj1GNAlIaUUpRoFU3oA2gWR0CdhIyfL9uQdX2UKGgGaAloD0MI6zao/VYxaECUhpRSlGgVTegDaBZHQJ2F9vVEuxt1fZQoaAZoCWgPQwh/ox03/D1hQJSGlFKUaBVN6ANoFkdAnYsjLSuyNXV9lChoBmgJaA9DCKkT0ETYHWVAlIaUUpRoFU3oA2gWR0CdjhwcHWz4dX2UKGgGaAloD0MILPNWXYfwZkCUhpRSlGgVTegDaBZHQJ2OkJMQEp11fZQoaAZoCWgPQwjFcHUARFVkQJSGlFKUaBVN6ANoFkdAnZTPYvnKXHV9lChoBmgJaA9DCJKwbycRYWVAlIaUUpRoFU3oA2gWR0CdlYwpe/pMdX2UKGgGaAloD0MIBmUaTS6gZECUhpRSlGgVTegDaBZHQJ2boRSP2f11fZQoaAZoCWgPQwgHlbiOcZljQJSGlFKUaBVN6ANoFkdAnZ/JWV/tpnV9lChoBmgJaA9DCH9rJ0rCrWVAlIaUUpRoFU3oA2gWR0CdolE+gUUPdX2UKGgGaAloD0MIxqLp7GTvZkCUhpRSlGgVTegDaBZHQJ2oljurp7l1fZQoaAZoCWgPQwi+FB40u/hSQJSGlFKUaBVLtWgWR0Cdqr0gKWszdX2UKGgGaAloD0MIih9j7toqYUCUhpRSlGgVTegDaBZHQJ2tbnoxHoZ1fZQoaAZoCWgPQwhSZRh3g8JRQJSGlFKUaBVLq2gWR0Cds2WGRFI/dX2UKGgGaAloD0MIBwq8k08gXECUhpRSlGgVTegDaBZHQJ22/yH2ys11fZQoaAZoCWgPQwiNmq+SD3NiQJSGlFKUaBVN6ANoFkdAnbfmjGkvb3V9lChoBmgJaA9DCGiyf54GhEpAlIaUUpRoFUulaBZHQJ24sBhhH9Z1fZQoaAZoCWgPQwhOKhprf/tfQJSGlFKUaBVN6ANoFkdAnbxpElVtGnV9lChoBmgJaA9DCLt868P6n2NAlIaUUpRoFU3oA2gWR0CdvoER8MNMdX2UKGgGaAloD0MIineAJ63vZECUhpRSlGgVTegDaBZHQJ2/BX2dupF1ZS4="
|
73 |
},
|
74 |
"ep_success_buffer": {
|
75 |
":type:": "<class 'collections.deque'>",
|
76 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
77 |
},
|
78 |
+
"_n_updates": 736,
|
79 |
"n_steps": 2048,
|
80 |
"gamma": 0.998,
|
81 |
+
"gae_lambda": 0.995,
|
82 |
"ent_coef": 0.01,
|
83 |
"vf_coef": 0.5,
|
84 |
"max_grad_norm": 0.5,
|
85 |
+
"batch_size": 256,
|
86 |
+
"n_epochs": 16,
|
87 |
"clip_range": {
|
88 |
":type:": "<class 'function'>",
|
89 |
":serialized:": "gAWVkQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGFDOlxVc2Vyc1xtYWxoc2FsXGRldlxkYmNvbmRhLTIwMjFfMDUtcHkzOC1yMzZcbGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flGgNdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBdoDowMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBiMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
|
ppo-LunarLander-v2/policy.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 84637
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3b0d81313c36fc9173c9d9e26fd47999d5f546488ecb30ee8f369a0c4c86083
|
3 |
size 84637
|
ppo-LunarLander-v2/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 43073
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3499a539a73d6f077ba3e8fe992ee74c2eafa69036a725da13b9143a8694b04
|
3 |
size 43073
|
replay.mp4
ADDED
File without changes
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": 270.9381606251052, "std_reward": 27.90070855706005, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-11T17:59:47.340160"}
|