Mriganka1999 committed
Commit 9b69dac
Parent(s): a9c56c1
Initial commit
- README.md +37 -0
- config.json +1 -0
- replay.mp4 +0 -0
- results.json +1 -0
- td3-PandaPickAndPlaceDense-v3.zip +3 -0
- td3-PandaPickAndPlaceDense-v3/_stable_baselines3_version +1 -0
- td3-PandaPickAndPlaceDense-v3/actor.optimizer.pth +3 -0
- td3-PandaPickAndPlaceDense-v3/critic.optimizer.pth +3 -0
- td3-PandaPickAndPlaceDense-v3/data +114 -0
- td3-PandaPickAndPlaceDense-v3/policy.pth +3 -0
- td3-PandaPickAndPlaceDense-v3/pytorch_variables.pth +3 -0
- td3-PandaPickAndPlaceDense-v3/system_info.txt +9 -0
- vec_normalize.pkl +3 -0
README.md
ADDED
@@ -0,0 +1,37 @@
---
library_name: stable-baselines3
tags:
- PandaPickAndPlaceDense-v3
- deep-reinforcement-learning
- reinforcement-learning
- stable-baselines3
model-index:
- name: TD3
  results:
  - task:
      type: reinforcement-learning
      name: reinforcement-learning
    dataset:
      name: PandaPickAndPlaceDense-v3
      type: PandaPickAndPlaceDense-v3
    metrics:
    - type: mean_reward
      value: -10.67 +/- 3.74
      name: mean_reward
      verified: false
---

# **TD3** Agent playing **PandaPickAndPlaceDense-v3**

This is a trained model of a **TD3** agent playing **PandaPickAndPlaceDense-v3**
using the [stable-baselines3 library](https://github.com/DLR-RM/stable-baselines3).

## Usage (with Stable-baselines3)

Download the checkpoint from the Hub and load it with stable-baselines3 (the repo id below is assumed from this repository's name and file list):

```python
from stable_baselines3 import TD3
from huggingface_sb3 import load_from_hub

# Repo id assumed from this repository; adjust if it differs.
checkpoint = load_from_hub("Mriganka1999/td3-PandaPickAndPlaceDense-v3", "td3-PandaPickAndPlaceDense-v3.zip")
model = TD3.load(checkpoint)
```
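Since the repository also ships `vec_normalize.pkl`, the agent was presumably trained with normalized observations, so the saved statistics should be loaded at inference time. A minimal sketch of running the agent in the environment, assuming the `panda_gym` package registers `PandaPickAndPlaceDense-v3` and the same repo id as above:

```python
import gymnasium as gym
import panda_gym  # noqa: F401  -- assumed dependency that registers the Panda envs
from huggingface_sb3 import load_from_hub
from stable_baselines3 import TD3
from stable_baselines3.common.vec_env import DummyVecEnv, VecNormalize

repo_id = "Mriganka1999/td3-PandaPickAndPlaceDense-v3"  # assumed repo id
checkpoint = load_from_hub(repo_id, "td3-PandaPickAndPlaceDense-v3.zip")
stats_path = load_from_hub(repo_id, "vec_normalize.pkl")

# Wrap the env and restore the saved normalization statistics.
env = DummyVecEnv([lambda: gym.make("PandaPickAndPlaceDense-v3")])
env = VecNormalize.load(stats_path, env)
env.training = False      # freeze the running statistics at test time
env.norm_reward = False   # report raw rewards

model = TD3.load(checkpoint)
obs = env.reset()
for _ in range(1000):
    action, _ = model.predict(obs, deterministic=True)
    obs, reward, done, info = env.step(action)
```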
config.json
ADDED
@@ -0,0 +1 @@
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVNwAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLnRkMy5wb2xpY2llc5SMEE11bHRpSW5wdXRQb2xpY3mUk5Qu", "__module__": "stable_baselines3.td3.policies", "__doc__": "\n Policy class (with both actor and critic) for TD3 to be used with Dict observation spaces.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ", "__init__": "<function MultiInputPolicy.__init__ at 0x79f7ba9d32e0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x79f7ba9d5bc0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1000000, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1719148534956247250, "learning_rate": 0.001, "tensorboard_log": null, "_last_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWViwIAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAAn5SXP6UzKD8phss81C/6vqgRQj8phss8rz+Nv3HgHj+cnMs81z8Mv2zHd79q5co8lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAfomHv8HSqD9ryYq/mLTpvj7wer9ryYq/jcB8vylHQTxryYq/+9a/v0yClj8TR4W/lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWMAEAAAAAAADpyXu/Wz6HP7RG0T29u5e+i94DP0KGJD+o8oC/n5SXP6UzKD8phss88C0CPI0FFLucnZC7eSeyOzmnDTt/JkA8q4ZFuoaoU7sn4oe75bgCvtXfdj+Isgm+sGFyvg2oTD8BGYO9IJCCv9Qv+r6oEUI/KYbLPAam8js5y7y6iNgmO55K9TvZw5A7fyZAPGWGRbqXqFO76WGPuovM5D45sAo/5EJtPA81LkDQF2w/hAE2QAVWiz+vP42/ceAeP5ycyzy9vgM8/EbdurgaNLoRMq07ESavO4rPMDz+0jS8KKQcvASQE7tQAnQ/W3lZP94ECz/woKA+qfiJPmOkMrwakIK/1z8Mv2zHd79q5co8/U0TPNU4zbpAZLO6Wi23O/swSjt+JkA8VotFuripU7vn/EC7lGgOSwRLE4aUaBJ0lFKUdS4=", "achieved_goal": "[[ 1.184223 0.65703803 0.02484425]\n [-0.48864615 0.7580819 0.02484425]\n [-1.103506 0.6206122 0.02485495]\n [-0.5478491 -0.9678867 0.0247676 ]]", "desired_goal": "[[-1.0588834 1.3189317 -1.0842718 ]\n [-0.45645595 -0.9802283 -1.0842718 ]\n [-0.9873131 0.01179675 -1.0842718 ]\n [-1.4987482 1.1758513 -1.0412315 ]]", "observation": "[[-9.8354965e-01 1.0565904e+00 1.0218564e-01 -2.9635420e-01\n 5.1511449e-01 6.4267361e-01 -1.0074053e+00 1.1842231e+00\n 6.5703803e-01 2.4844246e-02 7.9455227e-03 -2.2586316e-03\n -4.4133198e-03 5.4368344e-03 2.1614565e-03 1.1727928e-02\n -7.5350207e-04 -3.2296493e-03 -4.1468325e-03]\n [-1.2765844e-01 9.6435291e-01 -1.3447011e-01 -2.3670077e-01\n 7.9943925e-01 -6.4012535e-02 -1.0200233e+00 -4.8864615e-01\n 7.5808191e-01 2.4844246e-02 7.4050454e-03 -1.4403827e-03\n 2.5458653e-03 7.4857017e-03 4.4178781e-03 1.1727928e-02\n -7.5349800e-04 -3.2296532e-03 -1.0939214e-03]\n [ 4.4687304e-01 
5.4175144e-01 1.4481280e-02 2.7219884e+00\n 9.2223835e-01 2.8438425e+00 1.0885626e+00 -1.1035060e+00\n 6.2061220e-01 2.4854951e-02 8.0410810e-03 -1.6882117e-03\n -6.8704365e-04 5.2855094e-03 5.3451140e-03 1.0791669e-02\n -1.1036633e-02 -9.5606223e-03 -2.2516260e-03]\n [ 9.5316029e-01 8.4950799e-01 5.4304302e-01 3.1372786e-01\n 2.6947525e-01 -1.0903451e-02 -1.0200226e+00 -5.4784912e-01\n -9.6788669e-01 2.4767596e-02 8.9907618e-03 -1.5657196e-03\n -1.3686493e-03 5.5901231e-03 3.0851949e-03 1.1727927e-02\n -7.5357163e-04 -3.2297205e-03 -2.9447617e-03]]"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWViwIAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAAlQjZPU80bD1hwaM8DV8wvWtmiD1hwaM8TF7IvQADXz2ZwaM8iflFvT4nsL3Qv6M8lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAYS29vSuZ6j0K16M8f9cjvU19rb0K16M8U2+wvYG3pToK16M81r4Fvs4z0T2DTrs8lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWMAEAAAAAAADoL7K+uOxlPvHVdT49qCO+6vLXPYroXz68y/c5lQjZPU80bD1hwaM8NIliNyXybrdFdtS5khDFtzfAqLd08mwt7A5bMjWtZzKK8RO6Z1f/vTCkRz4jdUY+JGUTvgVGQj6hVaK6N9yDNQ1fML1rZog9YcGjPGz0brcNh2I3i9LIOZDAqDdTEcU3TJhsLVyuZzKpE1sy7/ITOq/NzjzDknM9BUdkPgLLJD+9i2c+HFJnPxVroT1MXsi9AANfPZnBozwRa5o3qRerNqhHjTdOFeC3dbItOIlBrLdyi/O64licumv4DjnPIiE+hO8hPiAMpz4jDSo7UasFPQJ4ejxJeoc1iflFvT4nsL3Qv6M8ONiMOE46GzcHMH24FrKpt0LuF7bQRVeslyZRL6kWWi4sf/u4lGgOSwRLE4aUaBJ0lFKUdS4=", "achieved_goal": "[[ 0.1059734 0.05766707 0.01998967]\n [-0.0430594 0.0666016 0.01998967]\n [-0.09783611 0.05444622 0.01998978]\n [-0.04833368 -0.08601235 0.01998892]]", "desired_goal": "[[-0.09237171 0.11454996 0.02 ]\n [-0.04000043 -0.08471165 0.02 ]\n [-0.08614983 0.00126432 0.02 ]\n [-0.1306108 0.10214959 0.02286459]]", "observation": "[[-3.48021746e-01 2.24535823e-01 2.40073934e-01 -1.59821466e-01\n 1.05443791e-01 2.18660504e-01 4.72633052e-04 1.05973400e-01\n 5.76670729e-02 1.99896712e-02 1.35025948e-05 -1.42422841e-05\n -4.05239087e-04 -2.34919462e-05 -2.01166677e-05 1.34688823e-11\n 1.27508706e-08 1.34853524e-08 -5.64359711e-04]\n [-1.24678425e-01 1.94962263e-01 1.93806216e-01 -1.43940508e-01\n 1.89720228e-01 -1.23851385e-03 9.82435154e-07 -4.30593975e-02\n 6.66015968e-02 1.99896712e-02 -1.42428144e-05 1.35020937e-05\n 3.83038394e-04 2.01168295e-05 2.34922973e-05 1.34488636e-11\n 1.34856144e-08 1.27519479e-08 5.64380491e-04]\n [ 2.52445620e-02 5.94661348e-02 2.22927168e-01 6.43722653e-01\n 2.26118997e-01 9.03596640e-01 7.88175240e-02 -9.78361070e-02\n 5.44462204e-02 1.99897755e-02 1.84080873e-05 5.09895153e-06\n 1.68418774e-05 -2.67128016e-05 4.14126152e-05 -2.05345150e-05\n -1.85809867e-03 -1.19283446e-03 1.36347182e-04]\n [ 1.57359347e-01 1.58140242e-01 3.26264381e-01 2.59477715e-03\n 3.26340832e-02 1.52874012e-02 1.00938735e-06 -4.83336784e-02\n -8.60123485e-02 1.99889243e-02 6.71599410e-05 9.25229506e-06\n -6.03646295e-05 -2.02292977e-05 -2.26394377e-06 -3.05920914e-12\n 1.90221491e-10 4.95875875e-11 -1.19923003e-04]]"}, "_episode_num": 20659, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": 
"gAWV4AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwCpA44p+c6OMAWyUSzKMAXSUR0DJIOPStvGZdX2UKGgGR8AmxCYTj/+9aAdLMmgIR0DJIebeoDPodX2UKGgGR8ASDO1OTJQtaAdLMmgIR0DJIdzMJQchdX2UKGgGR8AjoCLdepn6aAdLMmgIR0DJIb6C17Y1dX2UKGgGR8Am7kwN9YwJaAdLMmgIR0DJIkMzGgjAdX2UKGgGR8Akl68g6ltTaAdLMmgIR0DJI7bMkhRqdX2UKGgGR7+Y9kjHGS6laAdLAWgIR0DJI8HozN2UdX2UKGgGR8AmYCCBf8dgaAdLMmgIR0DJI7Km2sq8dX2UKGgGR8AprP2wmmcfaAdLMmgIR0DJI5ThNucddX2UKGgGR8Amm33Hq/ucaAdLMmgIR0DJJAVJQLuydX2UKGgGR8AjJLgXMyJsaAdLMmgIR0DJJRHOKO1fdX2UKGgGR8Aqx1mrbQC0aAdLMmgIR0DJJQBu89OidX2UKGgGR8AtaO6unuRcaAdLMmgIR0DJJOJvUBn0dX2UKGgGR7+dI065oXbeaAdLAWgIR0DJJOt3B55adX2UKGgGR8AjlNcGC7K8aAdLMmgIR0DJJVFE7W/bdX2UKGgGR8Arpyc0+C9RaAdLMmgIR0DJJlyTOgQIdX2UKGgGR8AYxweeWfK7aAdLMmgIR0DJJkstTUAldX2UKGgGR8Aw719fCyhSaAdLMmgIR0DJJjX7zkIYdX2UKGgGR8AsYmpEQXhwaAdLMmgIR0DJJp4GOdXldX2UKGgGR8AiGP9UCJXRaAdLMmgIR0DJJ6XB1s+FdX2UKGgGR8AsR+yZ8a4uaAdLMmgIR0DJJ5Rwjt5VdX2UKGgGR8ArAF8ohIOIaAdLMmgIR0DJJ332IwdsdX2UKGgGR8AUSgdwNsnBaAdLMmgIR0DJJ+YeA/cGdX2UKGgGR8Aqq8zQ/oq1aAdLMmgIR0DJKQX7JnxsdX2UKGgGR8AkFjoZAIIGaAdLMmgIR0DJKPalxffGdX2UKGgGR8AqL8gpz90jaAdLMmgIR0DJKOkvsZ5zdX2UKGgGR8AHj9Q40dilaAdLMmgIR0DJKXDtXxOMdX2UKGgGR8An81ZTyauwaAdLMmgIR0DJKqplUZNxdX2UKGgGR8Apcxzq8lHCaAdLMmgIR0DJKpkxASnMdX2UKGgGR8AohDm8ujASaAdLMmgIR0DJKoOXXyy2dX2UKGgGR8ApXWattALRaAdLMmgIR0DJKuscABDHdX2UKGgGR8AtVOgxrSE2aAdLMmgIR0DJK/V6gM+edX2UKGgGR8AmBLJ0W/JvaAdLMmgIR0DJK+QUUO/ddX2UKGgGR8AtDX1anrIHaAdLMmgIR0DJK85At4A0dX2UKGgGR8AjsurZJ04jaAdLMmgIR0DJLDXz19ORdX2UKGgGR8ArC4vvjOs1aAdLMmgIR0DJLUHbKzRhdX2UKGgGR8ApjRUFSsKcaAdLMmgIR0DJLTB8D0UXdX2UKGgGR8ATlf9gnc+JaAdLMmgIR0DJLRrGPxQSdX2UKGgGR7+Xy/bj94u9aAdLAWgIR0DJLSEDGLk0dX2UKGgGR8AkwhC+lCTmaAdLMmgIR0DJLYIVqN6xdX2UKGgGR8Afm/L1VYITaAdLMmgIR0DJLoweq7yydX2UKGgGR8AFyydFvybyaAdLMmgIR0DJLnuzfJmvdX2UKGgGR8AatNN8E3bVaAdLMmgIR0DJLmoz+FURdX2UKGgGR8AiUiBXjlxPaAdLMmgIR0DJLso2CNCJdX2UKGgGR8AxouYQarFPaAdLMmgIR0DJMBDh1klNdX2UKGgGR8AoqlpoK2KEaAdLMmgIR0DJMALgCOm0dX2UKGgGR8AZBY4hllK9aAdLMmgIR0DJL/6UmlZYdX2UKGgGR8AQwe6qbSZ0aAdLMmgIR0DJMH+0AtFsdX2UKGgGR8AqkrBj4HopaAdLMmgIR0DJMZObZvkzdX2UKGgGR8Ah1fZ26kIpaAdLMmgIR0DJMYN5Sm65dX2UKGgGR8Apaskpqh11aAdLMmgIR0DJMXgNVinYdX2UKGgGR8AlYbXpW3jNaAdLMmgIR0DJMdlM495hdX2UKGgGR8AlPuP3i704aAdLMmgIR0DJMuOdCmdidX2UKGgGR8Aj6eGO+7DmaAdLMmgIR0DJMtPMOf/WdX2UKGgGR8Aj/LwF1SwXaAdLMmgIR0DJMsM8NhE0dX2UKGgGR8AnOywfQrtmaAdLMmgIR0DJMybBhx5tdX2UKGgGR8AjeBg/keZHaAdLMmgIR0DJNC8yBTXKdX2UKGgGR8AqqE+xGDtgaAdLMmgIR0DJNB/9aUzLdX2UKGgGR8AlM3UhFEy+aAdLMmgIR0DJNA9Q0oBrdX2UKGgGR8AiBM2WIGhVaAdLMmgIR0DJNHMzXSSedX2UKGgGR8ArI7ihnJ1aaAdLMmgIR0DJNX316E8JdX2UKGgGR8AQy0v4/NaAaAdLMmgIR0DJNW19YwIudX2UKGgGR8AmCqo60Y0maAdLMmgIR0DJNVyZF5OadX2UKGgGR8AlXhky1uzhaAdLMmgIR0DJNc5sfq5cdX2UKGgGR8AtPJMg2ZRbaAdLMmgIR0DJNzQVCXyBdX2UKGgGR8AhqRh+fAbiaAdLMmgIR0DJNyOy/sVtdX2UKGgGR8AoNiS7oSteaAdLMmgIR0DJNxMmOU+tdX2UKGgGR8AmnSkTHsC1aAdLMmgIR0DJN3N1dPcjdX2UKGgGR8AcvRb8m8dxaAdLMmgIR0DJOH87MgU2dX2UKGgGR8AwOz9jwx33aAdLMmgIR0DJOG675Ec9dX2UKGgGR8AsffP5YYBOaAdLMmgIR0DJOF3Qtz0ZdX2UKGgGR8AZDub7TDwZaAdLMmgIR0DJOL/aL4vfdX2UKGgGR8AkR2fTTfBOaAdLMmgIR0DJOcs9IPK/dX2UKGgGR8AnXJK8L8aXaAdLMmgIR0DJObsSTQmedX2UKGgGR8Am13xFy7wsaAdLMmgIR0DJOatKNAC5dX2UKGgGR8Ao1eGfwqiHaAdLMmgIR0DJOg7U1AJLdX2UKGgGR8AY4z41xbSraAdLMmgIR0DJOxynHeabdX2UKGgGR8AVJBhQWN3oaAdLMmgIR0DJOwyc5Ke1dX2UKGgGR8AmTgxagVXWaAdLMmgIR0DJOvxfShJzdX2UKGgGR8Af3VTaTOgQaAdLMmgIR0DJO2FoWYWtdX2UKGgGR8AaiGFi8WbgaAdLMmgIR0DJPIkxREWqdX2UKGgGR8AbuLQ5WBBiaAdLMmgIR0DJPHvo5ggHdX2UKGgGR8AqfH4oJAt4aAdLMmgIR0DJPHVhoduHdX2UKGgGR8AtRWdVea8ZaAdLMmgIR0DJPPPqAz55dX2UKGgGR8AoX8CxNZeSaAdLMmgIR0DJPiNyFPBSdX2UKGgGR8AmVJqZc9nsaAdLMmgIR0DJPhNK9PDYdX2UKGgGR8AeI7uDzyz5aAdLMmgIR0DJPgJsGgSOdX2UKGgGR8
AkiWcjJMg2aAdLMmgIR0DJPmQiNbTudX2UKGgGR8AhsDrZ8KG+aAdLMmgIR0DJP2rYmLLqdX2UKGgGR8AbTLHMlkYoaAdLMmgIR0DJP1q5PM0QdX2UKGgGR8AooVvddmg8aAdLMmgIR0DJP0lCRfWudX2UKGgGR8ApYixmkFfRaAdLMmgIR0DJP6pY9xIbdX2UKGgGR8AUzypaRp1zaAdLMmgIR0DJQLTgflp5dX2UKGgGR8Au4LJCBwuNaAdLMmgIR0DJQKWFg2IgdX2UKGgGR8AZ/zQNTcZcaAdLMmgIR0DJQJYVKwpwdX2UKGgGR8AYtkd3jdYXaAdLMmgIR0DJQPmyE+PjdX2UKGgGR8Aj15kbxVhkaAdLMmgIR0DJQgK5y2hJdX2UKGgGR8AbgBmwqy4XaAdLMmgIR0DJQfMuJ1q4dX2UKGgGR8AqSSXdCVrzaAdLMmgIR0DJQeKvcJt0dX2UKGgGR8AkARlpXZGsaAdLMmgIR0DJQkPcQAdXdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVhgAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKImJiYmJiYiJiYmJiYmIiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiImJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYllLg=="}, "_n_updates": 249975, "buffer_size": 1000000, "batch_size": 256, "learning_starts": 100, "tau": 0.005, "gamma": 0.99, "gradient_steps": 1, "optimize_memory_usage": false, "replay_buffer_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwQRGljdFJlcGxheUJ1ZmZlcpSTlC4=", "__module__": "stable_baselines3.common.buffers", "__annotations__": "{'observation_space': <class 'gymnasium.spaces.dict.Dict'>, 'obs_shape': typing.Dict[str, typing.Tuple[int, ...]], 'observations': typing.Dict[str, numpy.ndarray], 'next_observations': typing.Dict[str, numpy.ndarray]}", "__doc__": "\n Dict Replay buffer used in off-policy algorithms like SAC/TD3.\n Extends the ReplayBuffer to use dictionary observations\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n Disabled for now (see https://github.com/DLR-RM/stable-baselines3/pull/243#discussion_r531535702)\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ", "__init__": "<function DictReplayBuffer.__init__ at 0x79f7babf30a0>", "add": "<function DictReplayBuffer.add at 0x79f7babf3130>", "sample": "<function DictReplayBuffer.sample at 0x79f7babf31c0>", "_get_samples": "<function DictReplayBuffer._get_samples at 0x79f7babf3250>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x79f7ba918a00>"}, "replay_buffer_kwargs": {}, "train_freq": {":type:": "<class 'stable_baselines3.common.type_aliases.TrainFreq'>", ":serialized:": "gAWVYQAAAAAAAACMJXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi50eXBlX2FsaWFzZXOUjAlUcmFpbkZyZXGUk5RLAWgAjBJUcmFpbkZyZXF1ZW5jeVVuaXSUk5SMBHN0ZXCUhZRSlIaUgZQu"}, "use_sde_at_warmup": false, "policy_delay": 2, "target_noise_clip": 0.5, "target_policy_noise": 0.2, "observation_space": {":type:": "<class 'gymnasium.spaces.dict.Dict'>", ":serialized:": 
"gAWVMgQAAAAAAACMFWd5bW5hc2l1bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwUZ3ltbmFzaXVtLnNwYWNlcy5ib3iUjANCb3iUk5QpgZR9lCiMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowNYm91bmRlZF9iZWxvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYDAAAAAAAAAAEBAZRoE4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksDhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoHCiWAwAAAAAAAAABAQGUaCBLA4WUaCR0lFKUjAZfc2hhcGWUSwOFlIwDbG93lGgcKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFksDhZRoJHSUUpSMBGhpZ2iUaBwolgwAAAAAAAAAAAAgQQAAIEEAACBBlGgWSwOFlGgkdJRSlIwIbG93X3JlcHKUjAUtMTAuMJSMCWhpZ2hfcmVwcpSMBDEwLjCUjApfbnBfcmFuZG9tlE51YowMZGVzaXJlZF9nb2FslGgNKYGUfZQoaBBoFmgZaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgnaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgsSwOFlGguaBwolgwAAAAAAAAAAAAgwQAAIMEAACDBlGgWSwOFlGgkdJRSlGgzaBwolgwAAAAAAAAAAAAgQQAAIEEAACBBlGgWSwOFlGgkdJRSlGg4jAUtMTAuMJRoOowEMTAuMJRoPE51YowLb2JzZXJ2YXRpb26UaA0pgZR9lChoEGgWaBloHCiWEwAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBlGggSxOFlGgkdJRSlGgnaBwolhMAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAZRoIEsThZRoJHSUUpRoLEsThZRoLmgcKJZMAAAAAAAAAAAAIMEAACDBAAAgwQAAIMEAACDBAAAgwQAAIMEAACDBAAAgwQAAIMEAACDBAAAgwQAAIMEAACDBAAAgwQAAIMEAACDBAAAgwQAAIMGUaBZLE4WUaCR0lFKUaDNoHCiWTAAAAAAAAAAAACBBAAAgQQAAIEEAACBBAAAgQQAAIEEAACBBAAAgQQAAIEEAACBBAAAgQQAAIEEAACBBAAAgQQAAIEEAACBBAAAgQQAAIEEAACBBlGgWSxOFlGgkdJRSlGg4jAUtMTAuMJRoOowEMTAuMJRoPE51YnVoLE5oEE5oPE51Yi4=", "spaces": "OrderedDict([('achieved_goal', Box(-10.0, 10.0, (3,), float32)), ('desired_goal', Box(-10.0, 10.0, (3,), float32)), ('observation', Box(-10.0, 10.0, (19,), float32))])", "_shape": null, "dtype": null, "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVagIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBAAAAAAAAAABAQEBlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKUjA1ib3VuZGVkX2Fib3ZllGgRKJYEAAAAAAAAAAEBAQGUaBVLBIWUaBl0lFKUjAZfc2hhcGWUSwSFlIwDbG93lGgRKJYQAAAAAAAAAAAAgL8AAIC/AACAvwAAgL+UaAtLBIWUaBl0lFKUjARoaWdolGgRKJYQAAAAAAAAAAAAgD8AAIA/AACAPwAAgD+UaAtLBIWUaBl0lFKUjAhsb3dfcmVwcpSMBC0xLjCUjAloaWdoX3JlcHKUjAMxLjCUjApfbnBfcmFuZG9tlIwUbnVtcHkucmFuZG9tLl9waWNrbGWUjBBfX2dlbmVyYXRvcl9jdG9ylJOUjAVQQ0c2NJRoMowUX19iaXRfZ2VuZXJhdG9yX2N0b3KUk5SGlFKUfZQojA1iaXRfZ2VuZXJhdG9ylIwFUENHNjSUjAVzdGF0ZZR9lChoPYoPgXom1R9zzxD9XYahopU7jANpbmOUihGJcbERIt8/Sc65c8qJGHiiAHWMCmhhc191aW50MzKUSwCMCHVpbnRlZ2VylEsAdWJ1Yi4=", "dtype": "float32", "bounded_below": "[ True True True True]", "bounded_above": "[ True True True True]", "_shape": [4], "low": "[-1. -1. -1. -1.]", "high": "[1. 1. 1. 
1.]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": "Generator(PCG64)"}, "n_envs": 4, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVoAMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLA0sTQwx0AIgAfACDAYMBUwCUToWUjAVmbG9hdJSFlIwScHJvZ3Jlc3NfcmVtYWluaW5nlIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwIPGxhbWJkYT6US2FDAgwAlIwOdmFsdWVfc2NoZWR1bGWUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxJL3Vzci9sb2NhbC9saWIvcHl0aG9uMy4xMC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGghfZR9lChoGGgPjAxfX3F1YWxuYW1lX1+UjCFnZXRfc2NoZWR1bGVfZm4uPGxvY2Fscz4uPGxhbWJkYT6UjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgZjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOUaAIoaAcoSwFLAEsASwFLAUsTQwSIAFMAlGgJKYwBX5SFlGgOjARmdW5jlEuFQwIEAZSMA3ZhbJSFlCl0lFKUaBVOTmgdKVKUhZR0lFKUaCRoPn2UfZQoaBhoNWgnjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlGgpfZRoK05oLE5oLWgZaC5OaC9oMUc/UGJN0vGp/IWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwhZRSlIWUaEZdlGhIfZR1hpSGUjAu"}, "actor_batch_norm_stats": [], "critic_batch_norm_stats": [], "actor_batch_norm_stats_target": [], "critic_batch_norm_stats_target": [], "system_info": {"OS": "Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sun Apr 28 14:29:16 UTC 2024", "Python": "3.10.12", "Stable-Baselines3": "2.3.2", "PyTorch": "2.3.0+cu121", "GPU Enabled": "False", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.29.1", "OpenAI Gym": "0.25.2"}}
replay.mp4
ADDED
Binary file (719 kB)
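A replay like this one can be regenerated with SB3's `VecVideoRecorder`; a rough sketch, where the render mode, clip length and output folder are assumptions and observation normalization is omitted for brevity:

```python
import gymnasium as gym
import panda_gym  # noqa: F401  -- assumed dependency that registers the Panda envs
from huggingface_sb3 import load_from_hub
from stable_baselines3 import TD3
from stable_baselines3.common.vec_env import DummyVecEnv, VecVideoRecorder

# Repo id assumed from this repository's name.
model = TD3.load(load_from_hub("Mriganka1999/td3-PandaPickAndPlaceDense-v3",
                               "td3-PandaPickAndPlaceDense-v3.zip"))

env = DummyVecEnv([lambda: gym.make("PandaPickAndPlaceDense-v3", render_mode="rgb_array")])
# Record one 500-step clip into ./videos.
env = VecVideoRecorder(env, "videos", record_video_trigger=lambda step: step == 0, video_length=500)

obs = env.reset()
for _ in range(500):
    action, _ = model.predict(obs, deterministic=True)
    obs, _, _, _ = env.step(action)
env.close()  # finalizes the recorded .mp4
```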
results.json
ADDED
@@ -0,0 +1 @@
{"mean_reward": -10.667819579690695, "std_reward": 3.7359066905370724, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-06-23T16:56:36.052816"}
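Numbers of this form (mean and standard deviation over 10 deterministic episodes) could have been produced with SB3's evaluation helper; a minimal sketch, reusing `model` and `env` as loaded in the README usage example above:

```python
from stable_baselines3.common.evaluation import evaluate_policy

# `model` and `env` as in the README usage sketch above (assumed).
mean_reward, std_reward = evaluate_policy(model, env, n_eval_episodes=10, deterministic=True)
print(f"mean_reward={mean_reward:.2f} +/- {std_reward:.2f}")
```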
td3-PandaPickAndPlaceDense-v3.zip
ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:d75238d637e4bc2862f3af4c5fd2691772bc738576d582fab24c82d11d816243
size 6402106
td3-PandaPickAndPlaceDense-v3/_stable_baselines3_version
ADDED
@@ -0,0 +1 @@
2.3.2
td3-PandaPickAndPlaceDense-v3/actor.optimizer.pth
ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:cbb3c29f0afb3bd2887faff107f92bfcfbd3aabbd8144934bdc0d69fd073d47d
size 1060384
td3-PandaPickAndPlaceDense-v3/critic.optimizer.pth
ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:85de8640797b66012d888361b52224f146677f439aa5c0332e17bb6f31a803d5
size 2130922
td3-PandaPickAndPlaceDense-v3/data
ADDED
@@ -0,0 +1,114 @@
{
"policy_class": {
":type:": "<class 'abc.ABCMeta'>",
":serialized:": "gAWVNwAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLnRkMy5wb2xpY2llc5SMEE11bHRpSW5wdXRQb2xpY3mUk5Qu",
"__module__": "stable_baselines3.td3.policies",
"__doc__": "\n Policy class (with both actor and critic) for TD3 to be used with Dict observation spaces.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ",
"__init__": "<function MultiInputPolicy.__init__ at 0x79f7ba9d32e0>",
"__abstractmethods__": "frozenset()",
"_abc_impl": "<_abc._abc_data object at 0x79f7ba9d5bc0>"
},
"verbose": 1,
"policy_kwargs": {},
"num_timesteps": 1000000,
"_total_timesteps": 1000000,
"_num_timesteps_at_start": 0,
"seed": null,
"action_noise": null,
"start_time": 1719148534956247250,
"learning_rate": 0.001,
"tensorboard_log": null,
"_last_obs": {
":type:": "<class 'collections.OrderedDict'>",
":serialized:": "gAWViwIAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAAn5SXP6UzKD8phss81C/6vqgRQj8phss8rz+Nv3HgHj+cnMs81z8Mv2zHd79q5co8lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAfomHv8HSqD9ryYq/mLTpvj7wer9ryYq/jcB8vylHQTxryYq/+9a/v0yClj8TR4W/lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWMAEAAAAAAADpyXu/Wz6HP7RG0T29u5e+i94DP0KGJD+o8oC/n5SXP6UzKD8phss88C0CPI0FFLucnZC7eSeyOzmnDTt/JkA8q4ZFuoaoU7sn4oe75bgCvtXfdj+Isgm+sGFyvg2oTD8BGYO9IJCCv9Qv+r6oEUI/KYbLPAam8js5y7y6iNgmO55K9TvZw5A7fyZAPGWGRbqXqFO76WGPuovM5D45sAo/5EJtPA81LkDQF2w/hAE2QAVWiz+vP42/ceAeP5ycyzy9vgM8/EbdurgaNLoRMq07ESavO4rPMDz+0jS8KKQcvASQE7tQAnQ/W3lZP94ECz/woKA+qfiJPmOkMrwakIK/1z8Mv2zHd79q5co8/U0TPNU4zbpAZLO6Wi23O/swSjt+JkA8VotFuripU7vn/EC7lGgOSwRLE4aUaBJ0lFKUdS4=",
"achieved_goal": "[[ 1.184223 0.65703803 0.02484425]\n [-0.48864615 0.7580819 0.02484425]\n [-1.103506 0.6206122 0.02485495]\n [-0.5478491 -0.9678867 0.0247676 ]]",
"desired_goal": "[[-1.0588834 1.3189317 -1.0842718 ]\n [-0.45645595 -0.9802283 -1.0842718 ]\n [-0.9873131 0.01179675 -1.0842718 ]\n [-1.4987482 1.1758513 -1.0412315 ]]",
"observation": "[[-9.8354965e-01 1.0565904e+00 1.0218564e-01 -2.9635420e-01\n 5.1511449e-01 6.4267361e-01 -1.0074053e+00 1.1842231e+00\n 6.5703803e-01 2.4844246e-02 7.9455227e-03 -2.2586316e-03\n -4.4133198e-03 5.4368344e-03 2.1614565e-03 1.1727928e-02\n -7.5350207e-04 -3.2296493e-03 -4.1468325e-03]\n [-1.2765844e-01 9.6435291e-01 -1.3447011e-01 -2.3670077e-01\n 7.9943925e-01 -6.4012535e-02 -1.0200233e+00 -4.8864615e-01\n 7.5808191e-01 2.4844246e-02 7.4050454e-03 -1.4403827e-03\n 2.5458653e-03 7.4857017e-03 4.4178781e-03 1.1727928e-02\n -7.5349800e-04 -3.2296532e-03 -1.0939214e-03]\n [ 4.4687304e-01 5.4175144e-01 1.4481280e-02 2.7219884e+00\n 9.2223835e-01 2.8438425e+00 1.0885626e+00 -1.1035060e+00\n 6.2061220e-01 2.4854951e-02 8.0410810e-03 -1.6882117e-03\n -6.8704365e-04 5.2855094e-03 5.3451140e-03 1.0791669e-02\n -1.1036633e-02 -9.5606223e-03 -2.2516260e-03]\n [ 9.5316029e-01 8.4950799e-01 5.4304302e-01 3.1372786e-01\n 2.6947525e-01 -1.0903451e-02 -1.0200226e+00 -5.4784912e-01\n -9.6788669e-01 2.4767596e-02 8.9907618e-03 -1.5657196e-03\n -1.3686493e-03 5.5901231e-03 3.0851949e-03 1.1727927e-02\n -7.5357163e-04 -3.2297205e-03 -2.9447617e-03]]"
},
"_last_episode_starts": {
":type:": "<class 'numpy.ndarray'>",
":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="
},
"_last_original_obs": {
":type:": "<class 'collections.OrderedDict'>",
":serialized:": "gAWViwIAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAAlQjZPU80bD1hwaM8DV8wvWtmiD1hwaM8TF7IvQADXz2ZwaM8iflFvT4nsL3Qv6M8lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAYS29vSuZ6j0K16M8f9cjvU19rb0K16M8U2+wvYG3pToK16M81r4Fvs4z0T2DTrs8lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWMAEAAAAAAADoL7K+uOxlPvHVdT49qCO+6vLXPYroXz68y/c5lQjZPU80bD1hwaM8NIliNyXybrdFdtS5khDFtzfAqLd08mwt7A5bMjWtZzKK8RO6Z1f/vTCkRz4jdUY+JGUTvgVGQj6hVaK6N9yDNQ1fML1rZog9YcGjPGz0brcNh2I3i9LIOZDAqDdTEcU3TJhsLVyuZzKpE1sy7/ITOq/NzjzDknM9BUdkPgLLJD+9i2c+HFJnPxVroT1MXsi9AANfPZnBozwRa5o3qRerNqhHjTdOFeC3dbItOIlBrLdyi/O64licumv4DjnPIiE+hO8hPiAMpz4jDSo7UasFPQJ4ejxJeoc1iflFvT4nsL3Qv6M8ONiMOE46GzcHMH24FrKpt0LuF7bQRVeslyZRL6kWWi4sf/u4lGgOSwRLE4aUaBJ0lFKUdS4=",
"achieved_goal": "[[ 0.1059734 0.05766707 0.01998967]\n [-0.0430594 0.0666016 0.01998967]\n [-0.09783611 0.05444622 0.01998978]\n [-0.04833368 -0.08601235 0.01998892]]",
"desired_goal": "[[-0.09237171 0.11454996 0.02 ]\n [-0.04000043 -0.08471165 0.02 ]\n [-0.08614983 0.00126432 0.02 ]\n [-0.1306108 0.10214959 0.02286459]]",
"observation": "[[-3.48021746e-01 2.24535823e-01 2.40073934e-01 -1.59821466e-01\n 1.05443791e-01 2.18660504e-01 4.72633052e-04 1.05973400e-01\n 5.76670729e-02 1.99896712e-02 1.35025948e-05 -1.42422841e-05\n -4.05239087e-04 -2.34919462e-05 -2.01166677e-05 1.34688823e-11\n 1.27508706e-08 1.34853524e-08 -5.64359711e-04]\n [-1.24678425e-01 1.94962263e-01 1.93806216e-01 -1.43940508e-01\n 1.89720228e-01 -1.23851385e-03 9.82435154e-07 -4.30593975e-02\n 6.66015968e-02 1.99896712e-02 -1.42428144e-05 1.35020937e-05\n 3.83038394e-04 2.01168295e-05 2.34922973e-05 1.34488636e-11\n 1.34856144e-08 1.27519479e-08 5.64380491e-04]\n [ 2.52445620e-02 5.94661348e-02 2.22927168e-01 6.43722653e-01\n 2.26118997e-01 9.03596640e-01 7.88175240e-02 -9.78361070e-02\n 5.44462204e-02 1.99897755e-02 1.84080873e-05 5.09895153e-06\n 1.68418774e-05 -2.67128016e-05 4.14126152e-05 -2.05345150e-05\n -1.85809867e-03 -1.19283446e-03 1.36347182e-04]\n [ 1.57359347e-01 1.58140242e-01 3.26264381e-01 2.59477715e-03\n 3.26340832e-02 1.52874012e-02 1.00938735e-06 -4.83336784e-02\n -8.60123485e-02 1.99889243e-02 6.71599410e-05 9.25229506e-06\n -6.03646295e-05 -2.02292977e-05 -2.26394377e-06 -3.05920914e-12\n 1.90221491e-10 4.95875875e-11 -1.19923003e-04]]"
},
"_episode_num": 20659,
"use_sde": false,
"sde_sample_freq": -1,
"_current_progress_remaining": 0.0,
"_stats_window_size": 100,
"ep_info_buffer": {
":type:": "<class 'collections.deque'>",
":serialized:": "gAWV4AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwCpA44p+c6OMAWyUSzKMAXSUR0DJIOPStvGZdX2UKGgGR8AmxCYTj/+9aAdLMmgIR0DJIebeoDPodX2UKGgGR8ASDO1OTJQtaAdLMmgIR0DJIdzMJQchdX2UKGgGR8AjoCLdepn6aAdLMmgIR0DJIb6C17Y1dX2UKGgGR8Am7kwN9YwJaAdLMmgIR0DJIkMzGgjAdX2UKGgGR8Akl68g6ltTaAdLMmgIR0DJI7bMkhRqdX2UKGgGR7+Y9kjHGS6laAdLAWgIR0DJI8HozN2UdX2UKGgGR8AmYCCBf8dgaAdLMmgIR0DJI7Km2sq8dX2UKGgGR8AprP2wmmcfaAdLMmgIR0DJI5ThNucddX2UKGgGR8Amm33Hq/ucaAdLMmgIR0DJJAVJQLuydX2UKGgGR8AjJLgXMyJsaAdLMmgIR0DJJRHOKO1fdX2UKGgGR8Aqx1mrbQC0aAdLMmgIR0DJJQBu89OidX2UKGgGR8AtaO6unuRcaAdLMmgIR0DJJOJvUBn0dX2UKGgGR7+dI065oXbeaAdLAWgIR0DJJOt3B55adX2UKGgGR8AjlNcGC7K8aAdLMmgIR0DJJVFE7W/bdX2UKGgGR8Arpyc0+C9RaAdLMmgIR0DJJlyTOgQIdX2UKGgGR8AYxweeWfK7aAdLMmgIR0DJJkstTUAldX2UKGgGR8Aw719fCyhSaAdLMmgIR0DJJjX7zkIYdX2UKGgGR8AsYmpEQXhwaAdLMmgIR0DJJp4GOdXldX2UKGgGR8AiGP9UCJXRaAdLMmgIR0DJJ6XB1s+FdX2UKGgGR8AsR+yZ8a4uaAdLMmgIR0DJJ5Rwjt5VdX2UKGgGR8ArAF8ohIOIaAdLMmgIR0DJJ332IwdsdX2UKGgGR8AUSgdwNsnBaAdLMmgIR0DJJ+YeA/cGdX2UKGgGR8Aqq8zQ/oq1aAdLMmgIR0DJKQX7JnxsdX2UKGgGR8AkFjoZAIIGaAdLMmgIR0DJKPalxffGdX2UKGgGR8AqL8gpz90jaAdLMmgIR0DJKOkvsZ5zdX2UKGgGR8AHj9Q40dilaAdLMmgIR0DJKXDtXxOMdX2UKGgGR8An81ZTyauwaAdLMmgIR0DJKqplUZNxdX2UKGgGR8Apcxzq8lHCaAdLMmgIR0DJKpkxASnMdX2UKGgGR8AohDm8ujASaAdLMmgIR0DJKoOXXyy2dX2UKGgGR8ApXWattALRaAdLMmgIR0DJKuscABDHdX2UKGgGR8AtVOgxrSE2aAdLMmgIR0DJK/V6gM+edX2UKGgGR8AmBLJ0W/JvaAdLMmgIR0DJK+QUUO/ddX2UKGgGR8AtDX1anrIHaAdLMmgIR0DJK85At4A0dX2UKGgGR8AjsurZJ04jaAdLMmgIR0DJLDXz19ORdX2UKGgGR8ArC4vvjOs1aAdLMmgIR0DJLUHbKzRhdX2UKGgGR8ApjRUFSsKcaAdLMmgIR0DJLTB8D0UXdX2UKGgGR8ATlf9gnc+JaAdLMmgIR0DJLRrGPxQSdX2UKGgGR7+Xy/bj94u9aAdLAWgIR0DJLSEDGLk0dX2UKGgGR8AkwhC+lCTmaAdLMmgIR0DJLYIVqN6xdX2UKGgGR8Afm/L1VYITaAdLMmgIR0DJLoweq7yydX2UKGgGR8AFyydFvybyaAdLMmgIR0DJLnuzfJmvdX2UKGgGR8AatNN8E3bVaAdLMmgIR0DJLmoz+FURdX2UKGgGR8AiUiBXjlxPaAdLMmgIR0DJLso2CNCJdX2UKGgGR8AxouYQarFPaAdLMmgIR0DJMBDh1klNdX2UKGgGR8AoqlpoK2KEaAdLMmgIR0DJMALgCOm0dX2UKGgGR8AZBY4hllK9aAdLMmgIR0DJL/6UmlZYdX2UKGgGR8AQwe6qbSZ0aAdLMmgIR0DJMH+0AtFsdX2UKGgGR8AqkrBj4HopaAdLMmgIR0DJMZObZvkzdX2UKGgGR8Ah1fZ26kIpaAdLMmgIR0DJMYN5Sm65dX2UKGgGR8Apaskpqh11aAdLMmgIR0DJMXgNVinYdX2UKGgGR8AlYbXpW3jNaAdLMmgIR0DJMdlM495hdX2UKGgGR8AlPuP3i704aAdLMmgIR0DJMuOdCmdidX2UKGgGR8Aj6eGO+7DmaAdLMmgIR0DJMtPMOf/WdX2UKGgGR8Aj/LwF1SwXaAdLMmgIR0DJMsM8NhE0dX2UKGgGR8AnOywfQrtmaAdLMmgIR0DJMybBhx5tdX2UKGgGR8AjeBg/keZHaAdLMmgIR0DJNC8yBTXKdX2UKGgGR8AqqE+xGDtgaAdLMmgIR0DJNB/9aUzLdX2UKGgGR8AlM3UhFEy+aAdLMmgIR0DJNA9Q0oBrdX2UKGgGR8AiBM2WIGhVaAdLMmgIR0DJNHMzXSSedX2UKGgGR8ArI7ihnJ1aaAdLMmgIR0DJNX316E8JdX2UKGgGR8AQy0v4/NaAaAdLMmgIR0DJNW19YwIudX2UKGgGR8AmCqo60Y0maAdLMmgIR0DJNVyZF5OadX2UKGgGR8AlXhky1uzhaAdLMmgIR0DJNc5sfq5cdX2UKGgGR8AtPJMg2ZRbaAdLMmgIR0DJNzQVCXyBdX2UKGgGR8AhqRh+fAbiaAdLMmgIR0DJNyOy/sVtdX2UKGgGR8AoNiS7oSteaAdLMmgIR0DJNxMmOU+tdX2UKGgGR8AmnSkTHsC1aAdLMmgIR0DJN3N1dPcjdX2UKGgGR8AcvRb8m8dxaAdLMmgIR0DJOH87MgU2dX2UKGgGR8AwOz9jwx33aAdLMmgIR0DJOG675Ec9dX2UKGgGR8AsffP5YYBOaAdLMmgIR0DJOF3Qtz0ZdX2UKGgGR8AZDub7TDwZaAdLMmgIR0DJOL/aL4vfdX2UKGgGR8AkR2fTTfBOaAdLMmgIR0DJOcs9IPK/dX2UKGgGR8AnXJK8L8aXaAdLMmgIR0DJObsSTQmedX2UKGgGR8Am13xFy7wsaAdLMmgIR0DJOatKNAC5dX2UKGgGR8Ao1eGfwqiHaAdLMmgIR0DJOg7U1AJLdX2UKGgGR8AY4z41xbSraAdLMmgIR0DJOxynHeabdX2UKGgGR8AVJBhQWN3oaAdLMmgIR0DJOwyc5Ke1dX2UKGgGR8AmTgxagVXWaAdLMmgIR0DJOvxfShJzdX2UKGgGR8Af3VTaTOgQaAdLMmgIR0DJO2FoWYWtdX2UKGgGR8AaiGFi8WbgaAdLMmgIR0DJPIkxREWqdX2UKGgGR8AbuLQ5WBBiaAdLMmgIR0DJPHvo5ggHdX2UKGgGR8AqfH4oJAt4aAdLMmgIR0DJPHVhoduHdX2UKGgGR8AtRWdVea8ZaAdLMmgIR0DJPPPqAz55dX2UKGgGR8AoX8CxNZeSaAdLMmgIR0DJPiNyFPBSdX2UKGgGR8AmVJqZc9nsaAdLMmgIR0DJPhNK9PDYdX2UKGgGR8AeI7uDzyz5aAdLMmgIR0DJPg
JsGgSOdX2UKGgGR8AkiWcjJMg2aAdLMmgIR0DJPmQiNbTudX2UKGgGR8AhsDrZ8KG+aAdLMmgIR0DJP2rYmLLqdX2UKGgGR8AbTLHMlkYoaAdLMmgIR0DJP1q5PM0QdX2UKGgGR8AooVvddmg8aAdLMmgIR0DJP0lCRfWudX2UKGgGR8ApYixmkFfRaAdLMmgIR0DJP6pY9xIbdX2UKGgGR8AUzypaRp1zaAdLMmgIR0DJQLTgflp5dX2UKGgGR8Au4LJCBwuNaAdLMmgIR0DJQKWFg2IgdX2UKGgGR8AZ/zQNTcZcaAdLMmgIR0DJQJYVKwpwdX2UKGgGR8AYtkd3jdYXaAdLMmgIR0DJQPmyE+PjdX2UKGgGR8Aj15kbxVhkaAdLMmgIR0DJQgK5y2hJdX2UKGgGR8AbgBmwqy4XaAdLMmgIR0DJQfMuJ1q4dX2UKGgGR8AqSSXdCVrzaAdLMmgIR0DJQeKvcJt0dX2UKGgGR8AkARlpXZGsaAdLMmgIR0DJQkPcQAdXdWUu"
},
"ep_success_buffer": {
":type:": "<class 'collections.deque'>",
":serialized:": "gAWVhgAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKImJiYmJiYiJiYmJiYmIiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiImJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYmJiYllLg=="
},
"_n_updates": 249975,
"buffer_size": 1000000,
"batch_size": 256,
"learning_starts": 100,
"tau": 0.005,
"gamma": 0.99,
"gradient_steps": 1,
"optimize_memory_usage": false,
"replay_buffer_class": {
":type:": "<class 'abc.ABCMeta'>",
":serialized:": "gAWVOQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwQRGljdFJlcGxheUJ1ZmZlcpSTlC4=",
"__module__": "stable_baselines3.common.buffers",
"__annotations__": "{'observation_space': <class 'gymnasium.spaces.dict.Dict'>, 'obs_shape': typing.Dict[str, typing.Tuple[int, ...]], 'observations': typing.Dict[str, numpy.ndarray], 'next_observations': typing.Dict[str, numpy.ndarray]}",
"__doc__": "\n Dict Replay buffer used in off-policy algorithms like SAC/TD3.\n Extends the ReplayBuffer to use dictionary observations\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n Disabled for now (see https://github.com/DLR-RM/stable-baselines3/pull/243#discussion_r531535702)\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
"__init__": "<function DictReplayBuffer.__init__ at 0x79f7babf30a0>",
"add": "<function DictReplayBuffer.add at 0x79f7babf3130>",
"sample": "<function DictReplayBuffer.sample at 0x79f7babf31c0>",
"_get_samples": "<function DictReplayBuffer._get_samples at 0x79f7babf3250>",
"__abstractmethods__": "frozenset()",
"_abc_impl": "<_abc._abc_data object at 0x79f7ba918a00>"
},
"replay_buffer_kwargs": {},
"train_freq": {
":type:": "<class 'stable_baselines3.common.type_aliases.TrainFreq'>",
":serialized:": "gAWVYQAAAAAAAACMJXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi50eXBlX2FsaWFzZXOUjAlUcmFpbkZyZXGUk5RLAWgAjBJUcmFpbkZyZXF1ZW5jeVVuaXSUk5SMBHN0ZXCUhZRSlIaUgZQu"
},
"use_sde_at_warmup": false,
"policy_delay": 2,
"target_noise_clip": 0.5,
"target_policy_noise": 0.2,
"observation_space": {
":type:": "<class 'gymnasium.spaces.dict.Dict'>",
":serialized:": "gAWVMgQAAAAAAACMFWd5bW5hc2l1bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwUZ3ltbmFzaXVtLnNwYWNlcy5ib3iUjANCb3iUk5QpgZR9lCiMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowNYm91bmRlZF9iZWxvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYDAAAAAAAAAAEBAZRoE4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksDhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoHCiWAwAAAAAAAAABAQGUaCBLA4WUaCR0lFKUjAZfc2hhcGWUSwOFlIwDbG93lGgcKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFksDhZRoJHSUUpSMBGhpZ2iUaBwolgwAAAAAAAAAAAAgQQAAIEEAACBBlGgWSwOFlGgkdJRSlIwIbG93X3JlcHKUjAUtMTAuMJSMCWhpZ2hfcmVwcpSMBDEwLjCUjApfbnBfcmFuZG9tlE51YowMZGVzaXJlZF9nb2FslGgNKYGUfZQoaBBoFmgZaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgnaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgsSwOFlGguaBwolgwAAAAAAAAAAAAgwQAAIMEAACDBlGgWSwOFlGgkdJRSlGgzaBwolgwAAAAAAAAAAAAgQQAAIEEAACBBlGgWSwOFlGgkdJRSlGg4jAUtMTAuMJRoOowEMTAuMJRoPE51YowLb2JzZXJ2YXRpb26UaA0pgZR9lChoEGgWaBloHCiWEwAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBlGggSxOFlGgkdJRSlGgnaBwolhMAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAZRoIEsThZRoJHSUUpRoLEsThZRoLmgcKJZMAAAAAAAAAAAAIMEAACDBAAAgwQAAIMEAACDBAAAgwQAAIMEAACDBAAAgwQAAIMEAACDBAAAgwQAAIMEAACDBAAAgwQAAIMEAACDBAAAgwQAAIMGUaBZLE4WUaCR0lFKUaDNoHCiWTAAAAAAAAAAAACBBAAAgQQAAIEEAACBBAAAgQQAAIEEAACBBAAAgQQAAIEEAACBBAAAgQQAAIEEAACBBAAAgQQAAIEEAACBBAAAgQQAAIEEAACBBlGgWSxOFlGgkdJRSlGg4jAUtMTAuMJRoOowEMTAuMJRoPE51YnVoLE5oEE5oPE51Yi4=",
"spaces": "OrderedDict([('achieved_goal', Box(-10.0, 10.0, (3,), float32)), ('desired_goal', Box(-10.0, 10.0, (3,), float32)), ('observation', Box(-10.0, 10.0, (19,), float32))])",
"_shape": null,
"dtype": null,
"_np_random": null
},
"action_space": {
":type:": "<class 'gymnasium.spaces.box.Box'>",
":serialized:": "gAWVagIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBAAAAAAAAAABAQEBlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKUjA1ib3VuZGVkX2Fib3ZllGgRKJYEAAAAAAAAAAEBAQGUaBVLBIWUaBl0lFKUjAZfc2hhcGWUSwSFlIwDbG93lGgRKJYQAAAAAAAAAAAAgL8AAIC/AACAvwAAgL+UaAtLBIWUaBl0lFKUjARoaWdolGgRKJYQAAAAAAAAAAAAgD8AAIA/AACAPwAAgD+UaAtLBIWUaBl0lFKUjAhsb3dfcmVwcpSMBC0xLjCUjAloaWdoX3JlcHKUjAMxLjCUjApfbnBfcmFuZG9tlIwUbnVtcHkucmFuZG9tLl9waWNrbGWUjBBfX2dlbmVyYXRvcl9jdG9ylJOUjAVQQ0c2NJRoMowUX19iaXRfZ2VuZXJhdG9yX2N0b3KUk5SGlFKUfZQojA1iaXRfZ2VuZXJhdG9ylIwFUENHNjSUjAVzdGF0ZZR9lChoPYoPgXom1R9zzxD9XYahopU7jANpbmOUihGJcbERIt8/Sc65c8qJGHiiAHWMCmhhc191aW50MzKUSwCMCHVpbnRlZ2VylEsAdWJ1Yi4=",
"dtype": "float32",
"bounded_below": "[ True True True True]",
"bounded_above": "[ True True True True]",
"_shape": [
4
],
"low": "[-1. -1. -1. -1.]",
"high": "[1. 1. 1. 1.]",
"low_repr": "-1.0",
"high_repr": "1.0",
"_np_random": "Generator(PCG64)"
},
"n_envs": 4,
"lr_schedule": {
":type:": "<class 'function'>",
":serialized:": "gAWVoAMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLA0sTQwx0AIgAfACDAYMBUwCUToWUjAVmbG9hdJSFlIwScHJvZ3Jlc3NfcmVtYWluaW5nlIWUjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwIPGxhbWJkYT6US2FDAgwAlIwOdmFsdWVfc2NoZWR1bGWUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxJL3Vzci9sb2NhbC9saWIvcHl0aG9uMy4xMC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGghfZR9lChoGGgPjAxfX3F1YWxuYW1lX1+UjCFnZXRfc2NoZWR1bGVfZm4uPGxvY2Fscz4uPGxhbWJkYT6UjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgZjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOUaAIoaAcoSwFLAEsASwFLAUsTQwSIAFMAlGgJKYwBX5SFlGgOjARmdW5jlEuFQwIEAZSMA3ZhbJSFlCl0lFKUaBVOTmgdKVKUhZR0lFKUaCRoPn2UfZQoaBhoNWgnjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlGgpfZRoK05oLE5oLWgZaC5OaC9oMUc/UGJN0vGp/IWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwhZRSlIWUaEZdlGhIfZR1hpSGUjAu"
},
"actor_batch_norm_stats": [],
"critic_batch_norm_stats": [],
"actor_batch_norm_stats_target": [],
"critic_batch_norm_stats_target": []
}
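The hyperparameters recorded above (MultiInputPolicy, 4 parallel envs, 1e6 timesteps, buffer 1e6, batch 256, tau 0.005, gamma 0.99, train_freq 1, gradient_steps 1, policy_delay 2, target policy noise 0.2 clipped at 0.5, no action noise) could be turned back into a training script roughly as follows. This is a reconstruction under assumptions (the `panda_gym` dependency, the use of `make_vec_env` and `VecNormalize`), not the author's actual training code:

```python
import gymnasium as gym
import panda_gym  # noqa: F401  -- assumed dependency that registers the Panda envs
from stable_baselines3 import TD3
from stable_baselines3.common.env_util import make_vec_env
from stable_baselines3.common.vec_env import VecNormalize

# 4 parallel envs with observation/reward normalization (a vec_normalize.pkl is part of this repo).
env = make_vec_env("PandaPickAndPlaceDense-v3", n_envs=4)
env = VecNormalize(env)

model = TD3(
    "MultiInputPolicy",        # Dict observation space: achieved_goal / desired_goal / observation
    env,
    learning_rate=1e-3,
    buffer_size=1_000_000,
    learning_starts=100,
    batch_size=256,
    tau=0.005,
    gamma=0.99,
    train_freq=1,
    gradient_steps=1,
    policy_delay=2,
    target_policy_noise=0.2,
    target_noise_clip=0.5,
    verbose=1,
)
model.learn(total_timesteps=1_000_000)
model.save("td3-PandaPickAndPlaceDense-v3")
env.save("vec_normalize.pkl")  # keep the normalization statistics alongside the checkpoint
```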
td3-PandaPickAndPlaceDense-v3/policy.pth
ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:5545cd751f37d2571862fc34ad2b7f8c7b53cb056b0e45412e92163de8efc125
size 3189802
td3-PandaPickAndPlaceDense-v3/pytorch_variables.pth
ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:0c35cea3b2e60fb5e7e162d3592df775cd400e575a31c72f359fb9e654ab00c5
size 864
td3-PandaPickAndPlaceDense-v3/system_info.txt
ADDED
@@ -0,0 +1,9 @@
- OS: Linux-6.1.85+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sun Apr 28 14:29:16 UTC 2024
- Python: 3.10.12
- Stable-Baselines3: 2.3.2
- PyTorch: 2.3.0+cu121
- GPU Enabled: False
- Numpy: 1.25.2
- Cloudpickle: 2.2.1
- Gymnasium: 0.29.1
- OpenAI Gym: 0.25.2
vec_normalize.pkl
ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:d4b78ab02cde81acdae2e1277344781918365c91ce1911001748479abb8ed7fb
size 3247