dlarionov committed on
Commit
5a2122e
1 Parent(s): 62cdfc9

Uploaded first LunarLander-v2 model

Browse files
PPO_1M_LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0a919ed9304b7627d7e411e2f5782e1ef35346fd628ee53e4eeda9f6734c64c
3
- size 147991
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fead3c0948ece8d12d0153f204a527c0fbf31130fc62053832703d8ff91820e
3
+ size 147995
PPO_1M_LunarLander-v2/data CHANGED
@@ -4,20 +4,20 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7b6a3ce4c5e0>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7b6a3ce4c670>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7b6a3ce4c700>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7b6a3ce4c790>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7b6a3ce4c820>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7b6a3ce4c8b0>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7b6a3ce4c940>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7b6a3ce4c9d0>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7b6a3ce4ca60>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7b6a3ce4caf0>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7b6a3ce4cb80>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7b6a3ce4cc10>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x7b69dac91e40>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
@@ -26,12 +26,12 @@
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1720110596510561847,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAADAVWb6ID4a8JqoSO9fZODkGvAI+U443ugAAgD8AAIA/kzBEvhydWrxn4IA79WyEOeZXxT3vLJ26AACAPwAAgD/gUgm+VOC0P/Lc776lAre+w8jrvWKj270AAAAAAAAAAJomyrz/HSc/qWU3Pbb/077JAAU7jdlwPQAAAAAAAAAAZtLouyrqqT94VHG9XzbpvvPfy7tm+Rm8AAAAAAAAAADzMsI9KSQUugFQAbkCzfezC6ouOwOLGjgAAAAAAACAP9NPY769RHw8cw2lPCGSDTySaVy+S3YvPQAAgD8AAIA/mnOFvFhLAD8CECa9V8fWvsgUzTwl8vs8AAAAAAAAAAAmbSy+hpqFPp0DVT1tioy+DrUqvEIjWzwAAAAAAAAAADNFrzz2EF+6egmmtu7+QbLk82w78AvCNQAAgD8AAIA/OjcyvsPtdLwKoIi7d1bwuf2j5T3plME6AACAPwAAgD8Yuau+HAePvSDa+7kzg/y4FDe2PnYXbjkAAIA/AACAPwDJjL3DaXG6RqibtZWGULAnwq061k2yNAAAgD8AAIA/zgqCvlKxzDxSpYQ6jjscudhXX74A87C5AACAPwAAgD8gHiy+qL+avIpUiLyjzSa7RzsJPk5/AzwAAIA/AACAP4DY1T1gxL4/2p/7PrKxnb3HPJw9mmM7PgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
@@ -45,7 +45,7 @@
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
- ":serialized:": "gAWV/QsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG3r2FFlTWKMAWyUS+yMAXSUR0CVreXgLqlhdX2UKGgGR0Bgy/T/hl19aAdN6ANoCEdAla3xxYJVsHV9lChoBkdAbkgZXMhX82gHTXkBaAhHQJWut46fapR1fZQoaAZHQHD/67yxzJZoB0v9aAhHQJWu9iH6/It1fZQoaAZHQG7dmwaBI4FoB0vhaAhHQJWvXt3OfNB1fZQoaAZHQHCay7GvOhVoB0vyaAhHQJWv2JtSAH51fZQoaAZHQHFwNkFwDNhoB00WAWgIR0CVsHoL5RCQdX2UKGgGR0BYi0SElE7XaAdN6ANoCEdAlbFIgA6uGXV9lChoBkdAb0oaLGaQWGgHS+poCEdAlbHfomoitHV9lChoBkdAbfL5KODJ2mgHS9xoCEdAlbIy8WbgCXV9lChoBkdAcdLsCDEm6WgHTQ4BaAhHQJWybg9/z8R1fZQoaAZHQG/zk0SAYpFoB022A2gIR0CVsoFpwjt5dX2UKGgGR0BxAiU0Nz8xaAdL9WgIR0CVsvhkAggYdX2UKGgGR0BxGyWJJoTPaAdLzWgIR0CVs059Vmz0dX2UKGgGR0Bwx1UyYXwcaAdL1mgIR0CVs6GyHEdedX2UKGgGR0BxbC/fwZwXaAdNBAFoCEdAlbPZmRNh3XV9lChoBkdAchyhHskY42gHS91oCEdAlbU4ESuhbnV9lChoBkdAcBkT1kDp1WgHS/hoCEdAlbVQudwvQHV9lChoBkdARFECkoF3ZGgHS79oCEdAlbZIN3GGVXV9lChoBkdAcUSxKg7HQ2gHTR0BaAhHQJW2i5nUUfx1fZQoaAZHQHIxgFTvRZ5oB00PAWgIR0CVtxmdy1eCdX2UKGgGR0Bv6j1uivgWaAdLzmgIR0CVt2Fj/dZadX2UKGgGR0BwUwqd6LOzaAdNDQFoCEdAlbe287IT5HV9lChoBkdAcNz+fywwCmgHS+xoCEdAlbjdAood/HV9lChoBkdANOrlmvnr6mgHS8FoCEdAlbjp2yLQ5XV9lChoBkdAcKMEqUeMh2gHS/poCEdAlbk5+hGpdnV9lChoBkdAcJPr92ovSWgHTQoBaAhHQJW5bJ5mh/R1fZQoaAZHQHCghPfsNUhoB0v8aAhHQJW54ntv4ud1fZQoaAZHQGwzGbCrLhdoB0v6aAhHQJW6MWfseGR1fZQoaAZHQHHjLG7z06JoB0vZaAhHQJW7Sp6yB091fZQoaAZHQG8gzyJ9AopoB0vqaAhHQJW73ndO6/Z1fZQoaAZHQHBEySJTER9oB0vqaAhHQJW89SR8twt1fZQoaAZHQHDpxTn7pFFoB01KAWgIR0CVvSXZ5AyEdX2UKGgGR0Bxcm+De0ojaAdL2GgIR0CVvU+g13t8dX2UKGgGR0Bhyb72tdRjaAdN6ANoCEdAlb3pNfw7T3V9lChoBkdAcd8PYWcjJWgHTQIBaAhHQJW9+dbxEv11fZQoaAZHQG3Aj5bhWHVoB0vraAhHQJW+HIMjNY91fZQoaAZHQHAN1BQemvZoB00BAWgIR0CVvwlWfbsXdX2UKGgGR0BuDjobGWD6aAdL5WgIR0CVv3oTfzjFdX2UKGgGR0BwJuifxtpFaAdL1mgIR0CVv/wfyPMjdX2UKGgGR0BvwcEJSiudaAdL7mgIR0CVwDDNyHVPdX2UKGgGR0Bw0wQSSNfgaAdL/2gIR0CVwHkCFK02dX2UKGgGR0BxNNEofCAMaAdNJQFoCEdAlcEwDq4YrXV9lChoBkdAbzE+6iCaqmgHTRkBaAhHQJXCISRKYiR1fZQoaAZHQHJ8ItQKrrBoB0v8aAhHQJXDBYigTRJ1fZQoaAZHQG9d8zQ/oq1oB0vaaAhHQJXDEyHmA9V1fZQoaAZHQHAJLEtNBWxoB0vsaAhHQJXDuruIAOt1fZQoaAZHQG+fr
QokRjBoB0vaaAhHQJXEBc1O0sx1fZQoaAZHQG1jTLfUF0RoB0vmaAhHQJXESzcAR051fZQoaAZHQHEaT7MxGlRoB00HAWgIR0CVxKIy0rsjdX2UKGgGR0Bws8sMAmzCaAdNTQFoCEdAlcS44p+c6XV9lChoBkdAcDK5mh/RV2gHS/BoCEdAlcTFx0dRznV9lChoBkdAb591ZkkKNWgHS9ZoCEdAlcT6WHDaXnV9lChoBkdAbSUIvalDW2gHS/NoCEdAlcadlVcUunV9lChoBkdAa8hOsT37DWgHS+poCEdAlcbbSVnmJXV9lChoBkdAceuO09hZyWgHTRUBaAhHQJXHDSx7iQ11fZQoaAZHQG+fF2vB7/poB0vvaAhHQJXHrx+az/p1fZQoaAZHQHDkmmYSg5BoB00EAWgIR0CVyUaDf3vhdX2UKGgGR0BkYEkKNQ0oaAdN6ANoCEdAlcm7QTmGNHV9lChoBkdAbdPsxfv4NGgHS/FoCEdAlcny+HrQgXV9lChoBkdAbbF1jiGWU2gHS8NoCEdAlcqA/s3Q2XV9lChoBkdAb69lzU7SzGgHS+BoCEdAlcqVtGd7OXV9lChoBkdAcT7pLmITG2gHS+VoCEdAlcsdC/oJRnV9lChoBkdAb91yH2ys0mgHTQIBaAhHQJXLaveP7vZ1fZQoaAZHQG3FslTm4iJoB0vVaAhHQJXLc2Q4jr11fZQoaAZHQHBd6Jyhi9ZoB0vvaAhHQJXL2xhUipx1fZQoaAZHQHDtg2VE/jdoB0v9aAhHQJXMaPq9oOB1fZQoaAZHQHL4VHrhR65oB0vSaAhHQJXOCDzyz5Z1fZQoaAZHQG74MQVbiZRoB0vraAhHQJXOZKHwgDB1fZQoaAZHQHJIATZg5R1oB0v7aAhHQJXPTVJ+UhV1fZQoaAZHQG3NdvKlpGpoB0vfaAhHQJXPdEiMYMx1fZQoaAZHQHLtOIZZSvVoB0vkaAhHQJXSIXgtOEd1fZQoaAZHQHEy5DRc/t9oB0vxaAhHQJXSSNn5BTp1fZQoaAZHQHFR2ahHskZoB0v3aAhHQJXTGe5Fw1l1fZQoaAZHQG2eJHZsbedoB0voaAhHQJXTGWldkax1fZQoaAZHQG+4px3mmtRoB0vfaAhHQJXTZvES/TN1fZQoaAZHQG4kUhNdqtZoB0vqaAhHQJXULvBrN4Z1fZQoaAZHQHD3eafBeoloB00MAmgIR0CV1G1uzhP1dX2UKGgGR0BwR5/Aj6eoaAdL9WgIR0CV1QyiVSn+dX2UKGgGR0BwcdpN9H+ZaAdNMQFoCEdAldWg+EAYHnV9lChoBkdAccfjNY8uBmgHS99oCEdAldYiwnpjc3V9lChoBkdAb6yhxo7FKmgHS81oCEdAldaLZJ04i3V9lChoBkdAbpdzbvgFYGgHS/5oCEdAldcyWRigCnV9lChoBkdAcL+qtYB/7WgHTUsBaAhHQJXXwutfXwt1fZQoaAZHQG8gNHpbD/FoB00SAWgIR0CV2HkT6BRRdX2UKGgGR0BxFIzhxYJWaAdL9GgIR0CV2cA7xNItdX2UKGgGR0BsC7ytmtheaAdL42gIR0CV2iD15B1LdX2UKGgGR0BvemUliSaFaAdL0mgIR0CV2nDTz/ZNdX2UKGgGR0Bxmf4CZF5OaAdNDgFoCEdAldqATh5xBHV9lChoBkdAcMPRfF72MGgHS9toCEdAldqI0EX+EXV9lChoBkdAcLXanJkoW2gHS/9oCEdAldq/fTCtR3V9lChoBkdAR8NmjCYTkGgHS9RoCEdAlduoIjW07nV9lChoBkdAa1MdGy5ZsGgHS/FoCEdAldvW16Vt43V9lChoBkdAcUbEOiFj/mgHS+BoCEdAld0NxlxwQ3V9lChoBkdAbher3j+72GgHS+xoCEdAld8B1LamGnV9lChoBkdAbpCIXTEzf2gHS+FoCEdAld+GcFyJbnV9lChoBkdAXiMXcgyM1mgHTegDaAhHQJXfmnhsI
mh1fZQoaAZHQHDZt+b3Gn5oB0veaAhHQJXhoqMFUyZ1fZQoaAZHQG0dS3b212JoB0vyaAhHQJXh5tSAH3V1fZQoaAZHQHFNXP/rB0poB0vmaAhHQJXiLfxc3VF1ZS4="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x799e1e081bd0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x799e1e081c60>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x799e1e081cf0>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x799e1e081d80>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x799e1e081e10>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x799e1e081ea0>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x799e1e081f30>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x799e1e081fc0>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x799e1e082050>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x799e1e0820e0>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x799e1e082170>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x799e1e082200>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x799e1e018ec0>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
 
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1720160375106397861,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAANPxQD5O3rC8OiVtO6d2zLk3Oh2+8U6dugAAgD8AAIA/OtU8vlx4dbyWnB07rF9IOcd62z2fHEi6AACAPwAAgD/NU8y9e4SaukHHvT3JUUM2J+cAuwa/OjUAAIA/AAAAAACQl7xBk4w/7Pu1u7qpTb/gjm28XouoPAAAAAAAAAAAzQqMvNEkmT83+wC+NyBRv7PambySBJM8AAAAAAAAAAAAVMY9u6j3PcZLWD0DRTy+XYSYPQtfer0AAAAAAAAAAD3ym76p0zY+gTxIPrgHhb4Y26W8WhqZPQAAAAAAAAAApgtFPnt1oLw5b766Kl8MORnWDr6emfE5AACAPwAAgD9a9pW9hUvMuUIuGDNz7ZOwuQgyuwn9wrMAAIA/AACAPxp9+z3kCnQ+G7P8PMetxb7vcAg9wjVwPAAAAAAAAAAAM3U0PZT8k7xS6aq8wQr/vIVeOb0Gvn6+AACAPwAAgD+G/zc+mzK6vD4cpLqFPhI5YcYivmbS4DkAAIA/AACAP/anij67Phw/2tIPPDPOBb+CzxA+76EkvgAAAAAAAAAA0yMfPoXStLtIRg29Wh/aOikoH71VxNg7AACAPwAAgD/63DE+4ZyHvItkwzqq1xG5S37qveo5AroAAIA/AACAP/rRjD7IspU+q9xyvU4Qqb5dGZE9Y5T9OwAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
 
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWVAQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHFkxXXAdn2MAWyUTQ4BjAF0lEdAlaMG9+PRzHV9lChoBkdAc32Dr7fpEGgHTRsBaAhHQJYCud9Ujs51fZQoaAZHQHAZUdaMaS9oB0u+aAhHQJYC8N6PbPB1fZQoaAZHQHBZ3AAQxvhoB0vVaAhHQJYDsriEQGx1fZQoaAZHQGKVNwaR6nloB03oA2gIR0CWA8SR8twrdX2UKGgGR0BxGZsEaESNaAdL2GgIR0CWBSKzRhMKdX2UKGgGR0BxVcqFyq+8aAdLwmgIR0CWBb9iMHbAdX2UKGgGR0Bu+ivRqoIfaAdLuGgIR0CWBwWpIczZdX2UKGgGR0Bx7OyNXHR1aAdNOAFoCEdAlgfvGACnxnV9lChoBkdAcpqMdLg4wWgHTQoBaAhHQJYI2p0fYBh1fZQoaAZHQHC4aoIfKZFoB0u1aAhHQJYJZSDRMOB1fZQoaAZHQHJPSrgflp5oB0vPaAhHQJYKJUEPlMh1fZQoaAZHQHKgbR4QjD9oB01iAWgIR0CWClXkYGdJdX2UKGgGR0BwszjvNNahaAdLx2gIR0CWDFRWtEG8dX2UKGgGR0BxPFkK/mDEaAdLzWgIR0CWDovx6OYIdX2UKGgGR0Bu3sQ2/BWQaAdLvmgIR0CWD/8CgbqAdX2UKGgGR0BvaeoLofSyaAdLs2gIR0CWEWMxXXAedX2UKGgGR0BfAabayrxRaAdN6ANoCEdAlhG4hdMTOHV9lChoBkdAcL8b8WKuS2gHS+RoCEdAlhLXVbzK93V9lChoBkdAZPq1BMSK32gHTegDaAhHQJYUABXCCSR1fZQoaAZHQHGslKsdT5xoB0vsaAhHQJYUcVsUIs11fZQoaAZHQHI3ZHqeK9BoB0u1aAhHQJYUzwkPczt1fZQoaAZHQGP9E56t1ZFoB03oA2gIR0CWF8Lr5ZbIdX2UKGgGR0By6u3gDRtxaAdNrQFoCEdAlhiGEkB0ZHV9lChoBkdAcO5xWkrPMWgHS8doCEdAlhkFEE1VHXV9lChoBkdAcGtdyksSTWgHS6JoCEdAlhq4JiRW93V9lChoBkdAcNC+MIeHSGgHS9JoCEdAlhtx8lXzUnV9lChoBkdAbx073fyf+WgHS7JoCEdAlhyQvYe1bHV9lChoBkdAcF93gDRtxmgHS+NoCEdAlh2uKjzqbHV9lChoBkdAX66hXbM5fmgHTegDaAhHQJYfVG4I8hd1fZQoaAZHQHIc4TfzjFRoB0voaAhHQJYfple4Tbp1fZQoaAZHQG8IO+RHPNVoB0usaAhHQJYgvyhBZ6l1fZQoaAZHQHEvqzZ6D5FoB0vdaAhHQJYhptoBaLZ1fZQoaAZHQF7jNet0V8FoB03oA2gIR0CWIbCKaXrudX2UKGgGR0ByciBkI5YHaAdLqmgIR0CWIdR8+iaidX2UKGgGR0BxyDfYSQHSaAdL2WgIR0CWIf1ejVQRdX2UKGgGR0BjnnJ9y926aAdN6ANoCEdAliKE3S8aoHV9lChoBkdAbtzT3IuGsWgHTUwBaAhHQJYjSjnFHax1fZQoaAZHQHCOtrGipNtoB0vNaAhHQJYjWqCHymR1fZQoaAZHQG+cpR4yGi5oB0u5aAhHQJYjYa2nbZh1fZQoaAZHQHIhyqABkqdoB0u5aAhHQJYliLEUCaJ1fZQoaAZHQHE+b/XGwRpoB0vIaAhHQJYlt1SwW311fZQoaAZHQHGoT0th/iJoB0upaAhHQJYl+lsP8Q91fZQoaAZHQHJEvF3pwCNoB0uvaAhHQJYm9AJLM9t1fZQoaAZHQHFoE6o2n89oB00iAWgIR0CWJ0Wa+evqdX2UKGgGR0B0gRLi++M7aAdLtmgIR0CWKBFKCg9NdX2UKGgGR0BwnrGtITXbaAdL52gIR0CWKMR1HOKPdX2UKGgGR0ByHuQjl
gc+aAdL+2gIR0CWKb53Tuv2dX2UKGgGR0ByD2CGvfTDaAdNAwFoCEdAlinZ8neBQXV9lChoBkdAcg+lC1JDmmgHS9VoCEdAlinilenhsXV9lChoBkdAb5qU6gdwN2gHS9RoCEdAlinshHLA6HV9lChoBkdAcLECE6DGtWgHS91oCEdAlio+lwcYInV9lChoBkdAYn4E+PikwmgHTegDaAhHQJYrG5Xlr/N1fZQoaAZHQGFNszl90A9oB03oA2gIR0CWKyr0J4SpdX2UKGgGR0ByYLr8iwB6aAdL32gIR0CWLLX7Lt/ndX2UKGgGR0BgACkqMFUyaAdN6ANoCEdAli5ee4Cp33V9lChoBkdAcXeOHWSU1WgHS6RoCEdAli5qWw/xD3V9lChoBkdAcGEus90RvmgHTQgBaAhHQJYuzoxHoX91fZQoaAZHQHBT5drwe/5oB0vvaAhHQJYvFoFmnO11fZQoaAZHQHFYFn27FsJoB0u7aAhHQJYvNFQVKwp1fZQoaAZHQHCGug13t8hoB0vBaAhHQJYvVWtEG7l1fZQoaAZHQHFq21UlzEJoB0vpaAhHQJYvhUbT+eh1fZQoaAZHQHDPDWCmMwVoB0u3aAhHQJYwFvuPV/d1fZQoaAZHQG38uXeFcptoB0vAaAhHQJYwXexfOUt1fZQoaAZHQHEDPhIe5nVoB02BAWgIR0CWML1EVnEmdX2UKGgGR0ByAnBdld1MaAdNTwFoCEdAljDhU70WdnV9lChoBkdAclE0fHPu5WgHS/9oCEdAljDrteD3/XV9lChoBkdAbsF/e+Eh7mgHS7doCEdAljL3w9aEBnV9lChoBkdAcILmEXcgyWgHS7loCEdAljQyp71Iy3V9lChoBkdAcM76ol2NemgHS9BoCEdAljSAiml67nV9lChoBkdAbxLGACnxa2gHS7ZoCEdAljTLKV6eG3V9lChoBkdAbxVJZGKAKGgHTTwBaAhHQJY1LOC5Etx1fZQoaAZHQHAvTbN8ma9oB0u+aAhHQJY1w23rleZ1fZQoaAZHQHG684DLbHpoB0vMaAhHQJY2WBlMAWB1fZQoaAZHQGLn64MF2V5oB03oA2gIR0CWNnKO1fE5dX2UKGgGR0Bw48a86FM7aAdL8WgIR0CWNsvxpcoqdX2UKGgGR0BxXZVLi++NaAdNRgFoCEdAljeJR0lqrXV9lChoBkdAcgyakRBeHGgHTRIBaAhHQJY4Yi7kGRp1fZQoaAZHQHEnijcmBvtoB0vdaAhHQJY5XM2WIGh1fZQoaAZHQHC+7iIcinpoB0uwaAhHQJY6WB/Zuht1fZQoaAZHQHPpy4Bmwq1oB0vTaAhHQJY7Equr6tV1fZQoaAZHQHJJgRf4REpoB00CAWgIR0CWPEzxPO6edX2UKGgGR0Bww2aa1Cw9aAdLwmgIR0CWPEycTakAdX2UKGgGR0BxZsf8uSOjaAdL2mgIR0CWPG6mfoRqdX2UKGgGR0Bt3CxNZeRgaAdLvmgIR0CWPK/vv0AcdX2UKGgGR0BxaSnNxEORaAdL12gIR0CWPQ5lvqC6dX2UKGgGR0BxYqAYpDu0aAdLtWgIR0CWPyk1Mue0dX2UKGgGR0Bxe/+kxh2GaAdL4GgIR0CWP4AuIyj6dX2UKGgGR0BycH9JjDsMaAdNdwFoCEdAlj++jIq9XnV9lChoBkdAb/DTAnDziGgHS8toCEdAlkD0hNdqtnV9lChoBkdAcc9ufEn9emgHS95oCEdAlkJcrZrYXnV9lChoBkdAct6L0SRKYmgHTY8CaAhHQJZCs1fmcON1fZQoaAZHQGcK/YSQHRloB03oA2gIR0CWQ49E1EVndX2UKGgGR0BxDYf9xZMdaAdL6WgIR0CWREUFB6a9dX2UKGgGR0Bw3HogV45caAdL+2gIR0CWRMAhB7eEdX2UKGgGR0BwKfB55Z8saAdNAgFoCEdAlkT80UGmk3V9lChoBkdAb8ayRjjJdWgHS71oCEdAlkYU+
cH4XXV9lChoBkdAcySnWattAWgHTRcBaAhHQJZGl/MGHHp1fZQoaAZHQHDWAvQF9rpoB0vVaAhHQJZHxvNu+AV1fZQoaAZHQGVZlXJYDDFoB03oA2gIR0CWSgGWldkbdWUu"
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
PPO_1M_LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a05327f6d5323867d9d8c3d14ef0a3ca39ae6350e70fdf9d630f0b29b03fc3c
3
  size 88362
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fa0b0bcd3dfbb27e59dca5427a1acb0c068a548e533b7cfc3e4966fb4087e39
3
  size 88362
PPO_1M_LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:989984671b43832feb07beb397559756a58679e88d56859450c54f5b56af53e8
3
  size 43762
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:744a108159e3422b6cf452bdc5dad8e1546a6420d84fbbc46f93d677c3fd701c
3
  size 43762
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 245.99 +/- 82.76
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 249.08 +/- 38.67
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. 
In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7b6a3ce4c5e0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7b6a3ce4c670>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7b6a3ce4c700>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7b6a3ce4c790>", "_build": "<function ActorCriticPolicy._build at 0x7b6a3ce4c820>", "forward": "<function ActorCriticPolicy.forward at 0x7b6a3ce4c8b0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7b6a3ce4c940>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7b6a3ce4c9d0>", "_predict": "<function ActorCriticPolicy._predict at 0x7b6a3ce4ca60>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7b6a3ce4caf0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7b6a3ce4cb80>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7b6a3ce4cc10>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7b69dac91e40>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": 
null, "start_time": 1720110596510561847, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAADAVWb6ID4a8JqoSO9fZODkGvAI+U443ugAAgD8AAIA/kzBEvhydWrxn4IA79WyEOeZXxT3vLJ26AACAPwAAgD/gUgm+VOC0P/Lc776lAre+w8jrvWKj270AAAAAAAAAAJomyrz/HSc/qWU3Pbb/077JAAU7jdlwPQAAAAAAAAAAZtLouyrqqT94VHG9XzbpvvPfy7tm+Rm8AAAAAAAAAADzMsI9KSQUugFQAbkCzfezC6ouOwOLGjgAAAAAAACAP9NPY769RHw8cw2lPCGSDTySaVy+S3YvPQAAgD8AAIA/mnOFvFhLAD8CECa9V8fWvsgUzTwl8vs8AAAAAAAAAAAmbSy+hpqFPp0DVT1tioy+DrUqvEIjWzwAAAAAAAAAADNFrzz2EF+6egmmtu7+QbLk82w78AvCNQAAgD8AAIA/OjcyvsPtdLwKoIi7d1bwuf2j5T3plME6AACAPwAAgD8Yuau+HAePvSDa+7kzg/y4FDe2PnYXbjkAAIA/AACAPwDJjL3DaXG6RqibtZWGULAnwq061k2yNAAAgD8AAIA/zgqCvlKxzDxSpYQ6jjscudhXX74A87C5AACAPwAAgD8gHiy+qL+avIpUiLyjzSa7RzsJPk5/AzwAAIA/AACAP4DY1T1gxL4/2p/7PrKxnb3HPJw9mmM7PgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": 
"gAWV/QsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQG3r2FFlTWKMAWyUS+yMAXSUR0CVreXgLqlhdX2UKGgGR0Bgy/T/hl19aAdN6ANoCEdAla3xxYJVsHV9lChoBkdAbkgZXMhX82gHTXkBaAhHQJWut46fapR1fZQoaAZHQHD/67yxzJZoB0v9aAhHQJWu9iH6/It1fZQoaAZHQG7dmwaBI4FoB0vhaAhHQJWvXt3OfNB1fZQoaAZHQHCay7GvOhVoB0vyaAhHQJWv2JtSAH51fZQoaAZHQHFwNkFwDNhoB00WAWgIR0CVsHoL5RCQdX2UKGgGR0BYi0SElE7XaAdN6ANoCEdAlbFIgA6uGXV9lChoBkdAb0oaLGaQWGgHS+poCEdAlbHfomoitHV9lChoBkdAbfL5KODJ2mgHS9xoCEdAlbIy8WbgCXV9lChoBkdAcdLsCDEm6WgHTQ4BaAhHQJWybg9/z8R1fZQoaAZHQG/zk0SAYpFoB022A2gIR0CVsoFpwjt5dX2UKGgGR0BxAiU0Nz8xaAdL9WgIR0CVsvhkAggYdX2UKGgGR0BxGyWJJoTPaAdLzWgIR0CVs059Vmz0dX2UKGgGR0Bwx1UyYXwcaAdL1mgIR0CVs6GyHEdedX2UKGgGR0BxbC/fwZwXaAdNBAFoCEdAlbPZmRNh3XV9lChoBkdAchyhHskY42gHS91oCEdAlbU4ESuhbnV9lChoBkdAcBkT1kDp1WgHS/hoCEdAlbVQudwvQHV9lChoBkdARFECkoF3ZGgHS79oCEdAlbZIN3GGVXV9lChoBkdAcUSxKg7HQ2gHTR0BaAhHQJW2i5nUUfx1fZQoaAZHQHIxgFTvRZ5oB00PAWgIR0CVtxmdy1eCdX2UKGgGR0Bv6j1uivgWaAdLzmgIR0CVt2Fj/dZadX2UKGgGR0BwUwqd6LOzaAdNDQFoCEdAlbe287IT5HV9lChoBkdAcNz+fywwCmgHS+xoCEdAlbjdAood/HV9lChoBkdANOrlmvnr6mgHS8FoCEdAlbjp2yLQ5XV9lChoBkdAcKMEqUeMh2gHS/poCEdAlbk5+hGpdnV9lChoBkdAcJPr92ovSWgHTQoBaAhHQJW5bJ5mh/R1fZQoaAZHQHCghPfsNUhoB0v8aAhHQJW54ntv4ud1fZQoaAZHQGwzGbCrLhdoB0v6aAhHQJW6MWfseGR1fZQoaAZHQHHjLG7z06JoB0vZaAhHQJW7Sp6yB091fZQoaAZHQG8gzyJ9AopoB0vqaAhHQJW73ndO6/Z1fZQoaAZHQHBEySJTER9oB0vqaAhHQJW89SR8twt1fZQoaAZHQHDpxTn7pFFoB01KAWgIR0CVvSXZ5AyEdX2UKGgGR0Bxcm+De0ojaAdL2GgIR0CVvU+g13t8dX2UKGgGR0Bhyb72tdRjaAdN6ANoCEdAlb3pNfw7T3V9lChoBkdAcd8PYWcjJWgHTQIBaAhHQJW9+dbxEv11fZQoaAZHQG3Aj5bhWHVoB0vraAhHQJW+HIMjNY91fZQoaAZHQHAN1BQemvZoB00BAWgIR0CVvwlWfbsXdX2UKGgGR0BuDjobGWD6aAdL5WgIR0CVv3oTfzjFdX2UKGgGR0BwJuifxtpFaAdL1mgIR0CVv/wfyPMjdX2UKGgGR0BvwcEJSiudaAdL7mgIR0CVwDDNyHVPdX2UKGgGR0Bw0wQSSNfgaAdL/2gIR0CVwHkCFK02dX2UKGgGR0BxNNEofCAMaAdNJQFoCEdAlcEwDq4YrXV9lChoBkdAbzE+6iCaqmgHTRkBaAhHQJXCISRKYiR1fZQoaAZHQHJ8ItQKrrBoB0v8aAhHQJXDBYigTRJ1fZQoaAZHQG9d8zQ/oq1oB0vaaAhHQJXDEyHmA9V1fZQoaAZHQHAJLEtNBWxoB0vsaAhHQJXDuruIAOt1fZQoaAZHQG+frQokRjBoB0vaaAhHQJX
EBc1O0sx1fZQoaAZHQG1jTLfUF0RoB0vmaAhHQJXESzcAR051fZQoaAZHQHEaT7MxGlRoB00HAWgIR0CVxKIy0rsjdX2UKGgGR0Bws8sMAmzCaAdNTQFoCEdAlcS44p+c6XV9lChoBkdAcDK5mh/RV2gHS/BoCEdAlcTFx0dRznV9lChoBkdAb591ZkkKNWgHS9ZoCEdAlcT6WHDaXnV9lChoBkdAbSUIvalDW2gHS/NoCEdAlcadlVcUunV9lChoBkdAa8hOsT37DWgHS+poCEdAlcbbSVnmJXV9lChoBkdAceuO09hZyWgHTRUBaAhHQJXHDSx7iQ11fZQoaAZHQG+fF2vB7/poB0vvaAhHQJXHrx+az/p1fZQoaAZHQHDkmmYSg5BoB00EAWgIR0CVyUaDf3vhdX2UKGgGR0BkYEkKNQ0oaAdN6ANoCEdAlcm7QTmGNHV9lChoBkdAbdPsxfv4NGgHS/FoCEdAlcny+HrQgXV9lChoBkdAbbF1jiGWU2gHS8NoCEdAlcqA/s3Q2XV9lChoBkdAb69lzU7SzGgHS+BoCEdAlcqVtGd7OXV9lChoBkdAcT7pLmITG2gHS+VoCEdAlcsdC/oJRnV9lChoBkdAb91yH2ys0mgHTQIBaAhHQJXLaveP7vZ1fZQoaAZHQG3FslTm4iJoB0vVaAhHQJXLc2Q4jr11fZQoaAZHQHBd6Jyhi9ZoB0vvaAhHQJXL2xhUipx1fZQoaAZHQHDtg2VE/jdoB0v9aAhHQJXMaPq9oOB1fZQoaAZHQHL4VHrhR65oB0vSaAhHQJXOCDzyz5Z1fZQoaAZHQG74MQVbiZRoB0vraAhHQJXOZKHwgDB1fZQoaAZHQHJIATZg5R1oB0v7aAhHQJXPTVJ+UhV1fZQoaAZHQG3NdvKlpGpoB0vfaAhHQJXPdEiMYMx1fZQoaAZHQHLtOIZZSvVoB0vkaAhHQJXSIXgtOEd1fZQoaAZHQHEy5DRc/t9oB0vxaAhHQJXSSNn5BTp1fZQoaAZHQHFR2ahHskZoB0v3aAhHQJXTGe5Fw1l1fZQoaAZHQG2eJHZsbedoB0voaAhHQJXTGWldkax1fZQoaAZHQG+4px3mmtRoB0vfaAhHQJXTZvES/TN1fZQoaAZHQG4kUhNdqtZoB0vqaAhHQJXULvBrN4Z1fZQoaAZHQHD3eafBeoloB00MAmgIR0CV1G1uzhP1dX2UKGgGR0BwR5/Aj6eoaAdL9WgIR0CV1QyiVSn+dX2UKGgGR0BwcdpN9H+ZaAdNMQFoCEdAldWg+EAYHnV9lChoBkdAccfjNY8uBmgHS99oCEdAldYiwnpjc3V9lChoBkdAb6yhxo7FKmgHS81oCEdAldaLZJ04i3V9lChoBkdAbpdzbvgFYGgHS/5oCEdAldcyWRigCnV9lChoBkdAcL+qtYB/7WgHTUsBaAhHQJXXwutfXwt1fZQoaAZHQG8gNHpbD/FoB00SAWgIR0CV2HkT6BRRdX2UKGgGR0BxFIzhxYJWaAdL9GgIR0CV2cA7xNItdX2UKGgGR0BsC7ytmtheaAdL42gIR0CV2iD15B1LdX2UKGgGR0BvemUliSaFaAdL0mgIR0CV2nDTz/ZNdX2UKGgGR0Bxmf4CZF5OaAdNDgFoCEdAldqATh5xBHV9lChoBkdAcMPRfF72MGgHS9toCEdAldqI0EX+EXV9lChoBkdAcLXanJkoW2gHS/9oCEdAldq/fTCtR3V9lChoBkdAR8NmjCYTkGgHS9RoCEdAlduoIjW07nV9lChoBkdAa1MdGy5ZsGgHS/FoCEdAldvW16Vt43V9lChoBkdAcUbEOiFj/mgHS+BoCEdAld0NxlxwQ3V9lChoBkdAbher3j+72GgHS+xoCEdAld8B1LamGnV9lChoBkdAbpCIXTEzf2gHS+FoCEdAld+GcFyJbnV9lChoBkdAXiMXcgyM1mgHTegDaAhHQJXfmnhsImh1fZQoaAZHQHDZt+b
3Gn5oB0veaAhHQJXhoqMFUyZ1fZQoaAZHQG0dS3b212JoB0vyaAhHQJXh5tSAH3V1fZQoaAZHQHFNXP/rB0poB0vmaAhHQJXiLfxc3VF1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 310, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. 
]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV2wAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Thu Jun 27 21:05:47 UTC 2024", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.3.0+cu121", "GPU Enabled": "True", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. 
In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x799e1e081bd0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x799e1e081c60>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x799e1e081cf0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x799e1e081d80>", "_build": "<function ActorCriticPolicy._build at 0x799e1e081e10>", "forward": "<function ActorCriticPolicy.forward at 0x799e1e081ea0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x799e1e081f30>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x799e1e081fc0>", "_predict": "<function ActorCriticPolicy._predict at 0x799e1e082050>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x799e1e0820e0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x799e1e082170>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x799e1e082200>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x799e1e018ec0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": 
null, "start_time": 1720160375106397861, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAANPxQD5O3rC8OiVtO6d2zLk3Oh2+8U6dugAAgD8AAIA/OtU8vlx4dbyWnB07rF9IOcd62z2fHEi6AACAPwAAgD/NU8y9e4SaukHHvT3JUUM2J+cAuwa/OjUAAIA/AAAAAACQl7xBk4w/7Pu1u7qpTb/gjm28XouoPAAAAAAAAAAAzQqMvNEkmT83+wC+NyBRv7PambySBJM8AAAAAAAAAAAAVMY9u6j3PcZLWD0DRTy+XYSYPQtfer0AAAAAAAAAAD3ym76p0zY+gTxIPrgHhb4Y26W8WhqZPQAAAAAAAAAApgtFPnt1oLw5b766Kl8MORnWDr6emfE5AACAPwAAgD9a9pW9hUvMuUIuGDNz7ZOwuQgyuwn9wrMAAIA/AACAPxp9+z3kCnQ+G7P8PMetxb7vcAg9wjVwPAAAAAAAAAAAM3U0PZT8k7xS6aq8wQr/vIVeOb0Gvn6+AACAPwAAgD+G/zc+mzK6vD4cpLqFPhI5YcYivmbS4DkAAIA/AACAP/anij67Phw/2tIPPDPOBb+CzxA+76EkvgAAAAAAAAAA0yMfPoXStLtIRg29Wh/aOikoH71VxNg7AACAPwAAgD/63DE+4ZyHvItkwzqq1xG5S37qveo5AroAAIA/AACAP/rRjD7IspU+q9xyvU4Qqb5dGZE9Y5T9OwAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": 
"gAWVAQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHFkxXXAdn2MAWyUTQ4BjAF0lEdAlaMG9+PRzHV9lChoBkdAc32Dr7fpEGgHTRsBaAhHQJYCud9Ujs51fZQoaAZHQHAZUdaMaS9oB0u+aAhHQJYC8N6PbPB1fZQoaAZHQHBZ3AAQxvhoB0vVaAhHQJYDsriEQGx1fZQoaAZHQGKVNwaR6nloB03oA2gIR0CWA8SR8twrdX2UKGgGR0BxGZsEaESNaAdL2GgIR0CWBSKzRhMKdX2UKGgGR0BxVcqFyq+8aAdLwmgIR0CWBb9iMHbAdX2UKGgGR0Bu+ivRqoIfaAdLuGgIR0CWBwWpIczZdX2UKGgGR0Bx7OyNXHR1aAdNOAFoCEdAlgfvGACnxnV9lChoBkdAcpqMdLg4wWgHTQoBaAhHQJYI2p0fYBh1fZQoaAZHQHC4aoIfKZFoB0u1aAhHQJYJZSDRMOB1fZQoaAZHQHJPSrgflp5oB0vPaAhHQJYKJUEPlMh1fZQoaAZHQHKgbR4QjD9oB01iAWgIR0CWClXkYGdJdX2UKGgGR0BwszjvNNahaAdLx2gIR0CWDFRWtEG8dX2UKGgGR0BxPFkK/mDEaAdLzWgIR0CWDovx6OYIdX2UKGgGR0Bu3sQ2/BWQaAdLvmgIR0CWD/8CgbqAdX2UKGgGR0BvaeoLofSyaAdLs2gIR0CWEWMxXXAedX2UKGgGR0BfAabayrxRaAdN6ANoCEdAlhG4hdMTOHV9lChoBkdAcL8b8WKuS2gHS+RoCEdAlhLXVbzK93V9lChoBkdAZPq1BMSK32gHTegDaAhHQJYUABXCCSR1fZQoaAZHQHGslKsdT5xoB0vsaAhHQJYUcVsUIs11fZQoaAZHQHI3ZHqeK9BoB0u1aAhHQJYUzwkPczt1fZQoaAZHQGP9E56t1ZFoB03oA2gIR0CWF8Lr5ZbIdX2UKGgGR0By6u3gDRtxaAdNrQFoCEdAlhiGEkB0ZHV9lChoBkdAcO5xWkrPMWgHS8doCEdAlhkFEE1VHXV9lChoBkdAcGtdyksSTWgHS6JoCEdAlhq4JiRW93V9lChoBkdAcNC+MIeHSGgHS9JoCEdAlhtx8lXzUnV9lChoBkdAbx073fyf+WgHS7JoCEdAlhyQvYe1bHV9lChoBkdAcF93gDRtxmgHS+NoCEdAlh2uKjzqbHV9lChoBkdAX66hXbM5fmgHTegDaAhHQJYfVG4I8hd1fZQoaAZHQHIc4TfzjFRoB0voaAhHQJYfple4Tbp1fZQoaAZHQG8IO+RHPNVoB0usaAhHQJYgvyhBZ6l1fZQoaAZHQHEvqzZ6D5FoB0vdaAhHQJYhptoBaLZ1fZQoaAZHQF7jNet0V8FoB03oA2gIR0CWIbCKaXrudX2UKGgGR0ByciBkI5YHaAdLqmgIR0CWIdR8+iaidX2UKGgGR0BxyDfYSQHSaAdL2WgIR0CWIf1ejVQRdX2UKGgGR0BjnnJ9y926aAdN6ANoCEdAliKE3S8aoHV9lChoBkdAbtzT3IuGsWgHTUwBaAhHQJYjSjnFHax1fZQoaAZHQHCOtrGipNtoB0vNaAhHQJYjWqCHymR1fZQoaAZHQG+cpR4yGi5oB0u5aAhHQJYjYa2nbZh1fZQoaAZHQHIhyqABkqdoB0u5aAhHQJYliLEUCaJ1fZQoaAZHQHE+b/XGwRpoB0vIaAhHQJYlt1SwW311fZQoaAZHQHGoT0th/iJoB0upaAhHQJYl+lsP8Q91fZQoaAZHQHJEvF3pwCNoB0uvaAhHQJYm9AJLM9t1fZQoaAZHQHFoE6o2n89oB00iAWgIR0CWJ0Wa+evqdX2UKGgGR0B0gRLi++M7aAdLtmgIR0CWKBFKCg9NdX2UKGgGR0BwnrGtITXbaAdL52gIR0CWKMR1HOKPdX2UKGgGR0ByHuQjlgc+aAdL+2gIR0CWKb5
3Tuv2dX2UKGgGR0ByD2CGvfTDaAdNAwFoCEdAlinZ8neBQXV9lChoBkdAcg+lC1JDmmgHS9VoCEdAlinilenhsXV9lChoBkdAb5qU6gdwN2gHS9RoCEdAlinshHLA6HV9lChoBkdAcLECE6DGtWgHS91oCEdAlio+lwcYInV9lChoBkdAYn4E+PikwmgHTegDaAhHQJYrG5Xlr/N1fZQoaAZHQGFNszl90A9oB03oA2gIR0CWKyr0J4SpdX2UKGgGR0ByYLr8iwB6aAdL32gIR0CWLLX7Lt/ndX2UKGgGR0BgACkqMFUyaAdN6ANoCEdAli5ee4Cp33V9lChoBkdAcXeOHWSU1WgHS6RoCEdAli5qWw/xD3V9lChoBkdAcGEus90RvmgHTQgBaAhHQJYuzoxHoX91fZQoaAZHQHBT5drwe/5oB0vvaAhHQJYvFoFmnO11fZQoaAZHQHFYFn27FsJoB0u7aAhHQJYvNFQVKwp1fZQoaAZHQHCGug13t8hoB0vBaAhHQJYvVWtEG7l1fZQoaAZHQHFq21UlzEJoB0vpaAhHQJYvhUbT+eh1fZQoaAZHQHDPDWCmMwVoB0u3aAhHQJYwFvuPV/d1fZQoaAZHQG38uXeFcptoB0vAaAhHQJYwXexfOUt1fZQoaAZHQHEDPhIe5nVoB02BAWgIR0CWML1EVnEmdX2UKGgGR0ByAnBdld1MaAdNTwFoCEdAljDhU70WdnV9lChoBkdAclE0fHPu5WgHS/9oCEdAljDrteD3/XV9lChoBkdAbsF/e+Eh7mgHS7doCEdAljL3w9aEBnV9lChoBkdAcILmEXcgyWgHS7loCEdAljQyp71Iy3V9lChoBkdAcM76ol2NemgHS9BoCEdAljSAiml67nV9lChoBkdAbxLGACnxa2gHS7ZoCEdAljTLKV6eG3V9lChoBkdAbxVJZGKAKGgHTTwBaAhHQJY1LOC5Etx1fZQoaAZHQHAvTbN8ma9oB0u+aAhHQJY1w23rleZ1fZQoaAZHQHG684DLbHpoB0vMaAhHQJY2WBlMAWB1fZQoaAZHQGLn64MF2V5oB03oA2gIR0CWNnKO1fE5dX2UKGgGR0Bw48a86FM7aAdL8WgIR0CWNsvxpcoqdX2UKGgGR0BxXZVLi++NaAdNRgFoCEdAljeJR0lqrXV9lChoBkdAcgyakRBeHGgHTRIBaAhHQJY4Yi7kGRp1fZQoaAZHQHEnijcmBvtoB0vdaAhHQJY5XM2WIGh1fZQoaAZHQHC+7iIcinpoB0uwaAhHQJY6WB/Zuht1fZQoaAZHQHPpy4Bmwq1oB0vTaAhHQJY7Equr6tV1fZQoaAZHQHJJgRf4REpoB00CAWgIR0CWPEzxPO6edX2UKGgGR0Bww2aa1Cw9aAdLwmgIR0CWPEycTakAdX2UKGgGR0BxZsf8uSOjaAdL2mgIR0CWPG6mfoRqdX2UKGgGR0Bt3CxNZeRgaAdLvmgIR0CWPK/vv0AcdX2UKGgGR0BxaSnNxEORaAdL12gIR0CWPQ5lvqC6dX2UKGgGR0BxYqAYpDu0aAdLtWgIR0CWPyk1Mue0dX2UKGgGR0Bxe/+kxh2GaAdL4GgIR0CWP4AuIyj6dX2UKGgGR0BycH9JjDsMaAdNdwFoCEdAlj++jIq9XnV9lChoBkdAb/DTAnDziGgHS8toCEdAlkD0hNdqtnV9lChoBkdAcc9ufEn9emgHS95oCEdAlkJcrZrYXnV9lChoBkdAct6L0SRKYmgHTY8CaAhHQJZCs1fmcON1fZQoaAZHQGcK/YSQHRloB03oA2gIR0CWQ49E1EVndX2UKGgGR0BxDYf9xZMdaAdL6WgIR0CWREUFB6a9dX2UKGgGR0Bw3HogV45caAdL+2gIR0CWRMAhB7eEdX2UKGgGR0BwKfB55Z8saAdNAgFoCEdAlkT80UGmk3V9lChoBkdAb8ayRjjJdWgHS71oCEdAlkYU+cH4XXV9lChoBkdAcyS
nWattAWgHTRcBaAhHQJZGl/MGHHp1fZQoaAZHQHDWAvQF9rpoB0vVaAhHQJZHxvNu+AV1fZQoaAZHQGVZlXJYDDFoB03oA2gIR0CWSgGWldkbdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 310, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. 
]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV2wAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Thu Jun 27 21:05:47 UTC 2024", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.3.0+cu121", "GPU Enabled": "True", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 245.99350961740532, "std_reward": 82.75747283201814, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-07-04T17:14:29.913607"}
 
1
+ {"mean_reward": 249.0848227566832, "std_reward": 38.66584002925681, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-07-05T07:05:40.790053"}