Commit
·
d2fdf01
1
Parent(s):
5813b5c
Initial commit
Browse files- README.md +2 -3
- args.yml +1 -1
- config.yml +0 -2
- replay.mp4 +2 -2
- results.json +1 -1
- tqc-LiftCube-v0.zip +2 -2
- tqc-LiftCube-v0/actor.optimizer.pth +1 -1
- tqc-LiftCube-v0/critic.optimizer.pth +1 -1
- tqc-LiftCube-v0/data +17 -17
- tqc-LiftCube-v0/ent_coef_optimizer.pth +1 -1
- tqc-LiftCube-v0/policy.pth +1 -1
- tqc-LiftCube-v0/pytorch_variables.pth +1 -1
- train_eval_metrics.zip +2 -2
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
type: LiftCube-v0
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
-
value: -96.
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
@@ -64,10 +64,9 @@ python -m rl_zoo3.push_to_hub --algo tqc --env LiftCube-v0 -f logs/ -orga qgallo
|
|
64 |
```python
|
65 |
OrderedDict([('n_envs', 48),
|
66 |
('n_timesteps', 10000000.0),
|
67 |
-
('normalize', True),
|
68 |
('policy', 'MultiInputPolicy'),
|
69 |
('use_sde', True),
|
70 |
-
('
|
71 |
```
|
72 |
|
73 |
# Environment Arguments
|
|
|
16 |
type: LiftCube-v0
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
+
value: -96.99 +/- 0.13
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
|
|
64 |
```python
|
65 |
OrderedDict([('n_envs', 48),
|
66 |
('n_timesteps', 10000000.0),
|
|
|
67 |
('policy', 'MultiInputPolicy'),
|
68 |
('use_sde', True),
|
69 |
+
('normalize', False)])
|
70 |
```
|
71 |
|
72 |
# Environment Arguments
|
args.yml
CHANGED
@@ -56,7 +56,7 @@
|
|
56 |
- - save_replay_buffer
|
57 |
- false
|
58 |
- - seed
|
59 |
-
-
|
60 |
- - storage
|
61 |
- null
|
62 |
- - study_name
|
|
|
56 |
- - save_replay_buffer
|
57 |
- false
|
58 |
- - seed
|
59 |
+
- 2024069831
|
60 |
- - storage
|
61 |
- null
|
62 |
- - study_name
|
config.yml
CHANGED
@@ -3,8 +3,6 @@
|
|
3 |
- 48
|
4 |
- - n_timesteps
|
5 |
- 10000000.0
|
6 |
-
- - normalize
|
7 |
-
- true
|
8 |
- - policy
|
9 |
- MultiInputPolicy
|
10 |
- - use_sde
|
|
|
3 |
- 48
|
4 |
- - n_timesteps
|
5 |
- 10000000.0
|
|
|
|
|
6 |
- - policy
|
7 |
- MultiInputPolicy
|
8 |
- - use_sde
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:920d3f5b3dcb9571d988605d6484e4744637ae3ac6c560a89e098716d669a5b6
|
3 |
+
size 553134
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward": -96.
|
|
|
1 |
+
{"mean_reward": -96.98540720000001, "std_reward": 0.13347970467512954, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-06-09T00:29:27.305653"}
|
tqc-LiftCube-v0.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32e206e0ea4c82c1e48caad6d29e4f63ffc09435f70c23926b74245aaaa54397
|
3 |
+
size 3429724
|
tqc-LiftCube-v0/actor.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 589975
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4cc4ed13b9a6c6677006468cf2b775ad3861fe0071cf6ad5ad492c2d8fb844b
|
3 |
size 589975
|
tqc-LiftCube-v0/critic.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1255594
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:524d6e09ce30632b08a04bedea90b708a837f23e027787e79bbe5dd2fd88085c
|
3 |
size 1255594
|
tqc-LiftCube-v0/data
CHANGED
@@ -4,20 +4,20 @@
|
|
4 |
":serialized:": "gAWVMQAAAAAAAACMGHNiM19jb250cmliLnRxYy5wb2xpY2llc5SMEE11bHRpSW5wdXRQb2xpY3mUk5Qu",
|
5 |
"__module__": "sb3_contrib.tqc.policies",
|
6 |
"__doc__": "\n Policy class (with both actor and critic) for TQC.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param use_expln: Use ``expln()`` function instead of ``exp()`` when using gSDE to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param clip_mean: Clip the mean output when using gSDE to avoid numerical instability.\n :param features_extractor_class: Features extractor to use.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_quantiles: Number of quantiles for the critic.\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ",
|
7 |
-
"__init__": "<function MultiInputPolicy.__init__ at
|
8 |
"__abstractmethods__": "frozenset()",
|
9 |
-
"_abc_impl": "<_abc._abc_data object at
|
10 |
},
|
11 |
"verbose": 1,
|
12 |
"policy_kwargs": {
|
13 |
"use_sde": true
|
14 |
},
|
15 |
-
"num_timesteps":
|
16 |
"_total_timesteps": 10000000,
|
17 |
"_num_timesteps_at_start": 0,
|
18 |
"seed": 0,
|
19 |
"action_noise": null,
|
20 |
-
"start_time":
|
21 |
"learning_rate": 0.0003,
|
22 |
"tensorboard_log": null,
|
23 |
"_last_obs": null,
|
@@ -27,25 +27,25 @@
|
|
27 |
},
|
28 |
"_last_original_obs": {
|
29 |
":type:": "<class 'collections.OrderedDict'>",
|
30 |
-
":serialized:": "
|
31 |
-
"arm_qpos": "[[
|
32 |
-
"arm_qvel": "[[
|
33 |
-
"cube_pos": "[[
|
34 |
},
|
35 |
-
"_episode_num":
|
36 |
"use_sde": true,
|
37 |
"sde_sample_freq": -1,
|
38 |
-
"_current_progress_remaining": 0.
|
39 |
"_stats_window_size": 100,
|
40 |
"ep_info_buffer": {
|
41 |
":type:": "<class 'collections.deque'>",
|
42 |
-
":serialized:": "
|
43 |
},
|
44 |
"ep_success_buffer": {
|
45 |
":type:": "<class 'collections.deque'>",
|
46 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
47 |
},
|
48 |
-
"_n_updates":
|
49 |
"observation_space": {
|
50 |
":type:": "<class 'gymnasium.spaces.dict.Dict'>",
|
51 |
":serialized:": "gAWVzAMAAAAAAACMFWd5bW5hc2l1bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojAhhcm1fcXBvc5SMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBgAAAAAAAAABAQEBAQGUaBOMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLBoWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBwolgYAAAAAAAAAAQEBAQEBlGggSwaFlGgkdJRSlIwGX3NoYXBllEsGhZSMA2xvd5RoHCiWGAAAAAAAAADbD0nA2w9JwNsPScDbD0nA2w9JwNsPScCUaBZLBoWUaCR0lFKUjARoaWdolGgcKJYYAAAAAAAAANsPSUDbD0lA2w9JQNsPSUDbD0lA2w9JQJRoFksGhZRoJHSUUpSMCGxvd19yZXBylIwKLTMuMTQxNTkyN5SMCWhpZ2hfcmVwcpSMCTMuMTQxNTkyN5SMCl9ucF9yYW5kb22UTnVijAhhcm1fcXZlbJRoDSmBlH2UKGgQaBZoGWgcKJYGAAAAAAAAAAEBAQEBAZRoIEsGhZRoJHSUUpRoJ2gcKJYGAAAAAAAAAAEBAQEBAZRoIEsGhZRoJHSUUpRoLEsGhZRoLmgcKJYYAAAAAAAAAAAAIMEAACDBAAAgwQAAIMEAACDBAAAgwZRoFksGhZRoJHSUUpRoM2gcKJYYAAAAAAAAAAAAIEEAACBBAAAgQQAAIEEAACBBAAAgQZRoFksGhZRoJHSUUpRoOIwFLTEwLjCUaDqMBDEwLjCUaDxOdWKMCGN1YmVfcG9zlGgNKYGUfZQoaBBoFmgZaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgnaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgsSwOFlGguaBwolgwAAAAAAAAAAAAgwQAAIMEAACDBlGgWSwOFlGgkdJRSlGgzaBwolgwAAAAAAAAAAAAgQQAAIEEAACBBlGgWSwOFlGgkdJRSlGg4jAUtMTAuMJRoOowEMTAuMJRoPE51YnVoLE5oEE5oPE51Yi4=",
|
@@ -83,12 +83,12 @@
|
|
83 |
"__module__": "stable_baselines3.common.buffers",
|
84 |
"__annotations__": "{'observation_space': <class 'gymnasium.spaces.dict.Dict'>, 'obs_shape': typing.Dict[str, typing.Tuple[int, ...]], 'observations': typing.Dict[str, numpy.ndarray], 'next_observations': typing.Dict[str, numpy.ndarray]}",
|
85 |
"__doc__": "\n Dict Replay buffer used in off-policy algorithms like SAC/TD3.\n Extends the ReplayBuffer to use dictionary observations\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n Disabled for now (see https://github.com/DLR-RM/stable-baselines3/pull/243#discussion_r531535702)\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
|
86 |
-
"__init__": "<function DictReplayBuffer.__init__ at
|
87 |
-
"add": "<function DictReplayBuffer.add at
|
88 |
-
"sample": "<function DictReplayBuffer.sample at
|
89 |
-
"_get_samples": "<function DictReplayBuffer._get_samples at
|
90 |
"__abstractmethods__": "frozenset()",
|
91 |
-
"_abc_impl": "<_abc._abc_data object at
|
92 |
},
|
93 |
"replay_buffer_kwargs": {},
|
94 |
"train_freq": {
|
|
|
4 |
":serialized:": "gAWVMQAAAAAAAACMGHNiM19jb250cmliLnRxYy5wb2xpY2llc5SMEE11bHRpSW5wdXRQb2xpY3mUk5Qu",
|
5 |
"__module__": "sb3_contrib.tqc.policies",
|
6 |
"__doc__": "\n Policy class (with both actor and critic) for TQC.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param use_expln: Use ``expln()`` function instead of ``exp()`` when using gSDE to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param clip_mean: Clip the mean output when using gSDE to avoid numerical instability.\n :param features_extractor_class: Features extractor to use.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_quantiles: Number of quantiles for the critic.\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ",
|
7 |
+
"__init__": "<function MultiInputPolicy.__init__ at 0x7f4fa75ef370>",
|
8 |
"__abstractmethods__": "frozenset()",
|
9 |
+
"_abc_impl": "<_abc._abc_data object at 0x7f4fa75fea80>"
|
10 |
},
|
11 |
"verbose": 1,
|
12 |
"policy_kwargs": {
|
13 |
"use_sde": true
|
14 |
},
|
15 |
+
"num_timesteps": 124800,
|
16 |
"_total_timesteps": 10000000,
|
17 |
"_num_timesteps_at_start": 0,
|
18 |
"seed": 0,
|
19 |
"action_noise": null,
|
20 |
+
"start_time": 1717892500259129213,
|
21 |
"learning_rate": 0.0003,
|
22 |
"tensorboard_log": null,
|
23 |
"_last_obs": null,
|
|
|
27 |
},
|
28 |
"_last_original_obs": {
|
29 |
":type:": "<class 'collections.OrderedDict'>",
|
30 |
+
":serialized:": "gAWVLwwAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojAhhcm1fcXBvc5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJaABAAAAAAAACVaD7762XM+q3p1PAAAgD/tQgYkguIfIsTFhD3IoXU+fWCKPDiKf7/5yFC9JCSDPMfwL72D/wo+q3p1PAAAgD+TpVojsWm+IhK8Ij362BU+q3p1PAAAgD/gle8jPy+sItYRaj1kSGw+q3p1PAAAgD834q8j3FY/IyNX8L0xaBI+q3p1PAAAgD/wn7QjubyLou5OlT1w4no+q3p1PAAAgD+2IQgkbB7ToT1uNr+VAVO/bcznPPIVf7/7K6O9qgrfvMo7BEHo9WDACSctPU5AH76zcg4862cmv7eDKMC0kThAQSVvPQIdeL9N3YU7jp5HPm+RQb2q6Sw+q3p1PAAAgD+8tcsjf5VJIrnzkz3I9lQ+q3p1PAAAgD8Lz9Ajuz6UIY6B1EAoG5TAjltiPZjWZb8RZga+QFgcvnJVEcG0hAPBJdCYPYR0FL/+xC8/77SjPgqrikBGemRCfSFfQpFpo75XOvY9qjY2P+CVmEBXUQzBGLksPXmVfj94ZpW9z+RFvU68oEEFALnALv5ZPnnhE77TBXa+S+Avv2YdxjtQp30+q3p1PAAAgD+mhvkjYP8NIp1bWb+aOwE/gUmcPLj/Tb+4ZVi91XeQvIr6rz1KxTU+q3p1PAAAgD+m/gwk+lA4nXoFgj3hNzc+q3p1PAAAgD9FPeEjDHoiIZCtC765PCs+q3p1PAAAgD+ZtwYkN3IOotRIKcAc6bk/cVxAPex9dD3Psxu/R48Iv1PTNb0E8B8+q3p1PAAAgD90aLEjDmMqIzOMkj0OAgU+q3p1PAAAgD+hlNYjCQ8RIw+wEr6R828+q5B2PJyRaD9DISI66wXBOmZ/N0Hw0FbBBehfPoOTez9w/O+9JiHxvGmwmDyJpls+q3p1PAAAgD+PCAsjqHOKJ/EXEr6GqPU9q3p1PAAAgD9OaMAjf0hwoTgFDEAvXzc/p7PRPMUtuDtzsMw+GpE/vwMKiEDWxTA/VN6YPHrTPz85hAk9z0mnvcsAL8H4bgg+c0moPbdJFr//Xo8826ZLvuwPDz4yEsk+DbKbPPCGfD8cqgO+rJGePWKlqb/hdq49xN8KP5P7RD/Vbty8qucCvzrWU0AxR7XA7lVePvpbND99uR0/x9+UvoF6sL3nO34+q3p1PAAAgD81/rEjmK3ComlFqr+P08e/W6UQP1U9PT/yeDq+4GQxvi7xMjzPx/I9q3p1PAAAgD++2/Eji2asooRt3b+ySrO/NmHJPMNPc7/iZDk+97lrvji4lsAVWIrAQm4BPQX/Zj9TYQA9ReN9vJsBmz1H1fQ9q3p1PAAAgD+kFwUkBAlvoUfS+bvwfyo+q3p1PAAAgD+BJu0jc+Mtosa/Wb/ztVs/dgLaPAfunj5s9zY/PTrIvpXHYUIuCaQ+re5iQf6kWb994E++QYSHPsI6xLtFAWU+kW6FPCxjfL8qhr67nNUXPkdeBT2smHw+q3p1PAAAgD9N0AskufZTH5kDuL1x/AQ+q3p1PAAAgD+ubLgjYXYzI/HaTD7/cJU+QzzHPDZyab9t9Z++p7JOPpSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLMEsGhpSMAUOUdJRSlIwIYXJtX3F2ZWyUaAcoloAEAAAAAAAAzczmpJqZkiQz4Bs21V5kpkofi6UrL6IkCcQ4Pk5gPj1IGCS+V30uwQKuEj9qLzPBl193o0WquCQz4Bs2MvrmpfQsg6ayihOlZmb6pDMzgyQz4Bs2tv57pQD/wqUXv7GjKIo4I0BYwCMz4Bs28dTlJQ5PYKZcTQqkzcxsIzMze6Mz4Bs2RA8PJUmvCyYzv5wj6diWpOFonSMz4Bs2VCEvpvE7ySXCWiGlqM3yv7KJ4795vhk+ZNZbwXscKEAsamxA9TClQRP9E8HLPza/OZLjP+FyQcJ4tlHCWqvRwLZPzUD02KC+XFTbP/d3MMFkH1VBzczII83MTKQz4Bs2FL2zplWjAqbRXmekmpkupQAAECUz4Bs2GPMwJlIfBab1VkulH5t6QU99QsHWuU09y2NIQEfbekAoKpLBOva1weGNqsHr0si//yUSQS3OkkCDmnDAuu4xQT6xD0Ol3gpDplCXwcfz38KtNMFCIG9CQRUqrcFrvLq+bNFBQUgDG0GlJ9bBj4ZCQlh+cMGlNANA/OJtQQ0dGkK8jBjCJswTJIoUKCMz4Bs20WYGpQ7iEybhIDakIWDovwephD+lzHM+XGmYwYv2ZsDlhgnDAADAIWZmhaQz4Bs2705QpiT/JyUQ/zakMzOPo83MzB8z4Bs2UgoFp0v/iSUU/7OjskuBIUUWc6Mz4Bs2LyGVplnp7aMQuF0jp9KhwGu9QkAq0IE/E7VRQUUfQUFaCjrB7EP/pPWYBSUz4Bs2/tuapTOGSaWBqLKkHWbjo4QRwyMz4Bs2fGcZpnAdR6bpAYKiCm/Eu90jlLwOUJ06BCTHvZtHPD6uEsQ/tMfmQbaRBcKmW+8+hBJLwZGovL8pP+jBYkTap15gjCQ34Bs2ZcLAJbcS4Krd0jCjzcwOJM3MvCIz4Bs2LymfpuH+2iQg56olXb6oQOy1wj+nVFW+a/bFwlp8N0MsggFDtd8iQcSqlT8+Tmi+WIz5wEWDAEEAoW5CI7nZwdDGPylHaLq/6e/9vkiSwr8pMDJBW5fWPuBIDj8iW4W9Sq7Jwb6OMUE9uHFBFG30wOABcL62Y/I/8Pqevm/SvMBz9ozAMhQGQaj6YcHyefu9IvNIwuD+tkEd74zBmpkFJJqZ6qQz4Bs2En+1JNOWZaY2vxkknGkHwQlzFMH4nV1ATsP1v+JWGsDBYgTBMzMVJM3MEiQz4Bs2AW/CpSPXqCXGbu+kJMlswA28cMAmhNy+dgIgQUjDHcGd6n7A49A3weChMsEauri+TP8CPwN8BT+ddgZAMzNbo83Mo6Q04Bs2235fpMY+byVXFwGlRpuEJHWjxSQz4Bs2NV3QpuSd+iQyBUckGuqmv6qTmD/53C8+sFmXQNxCCMC+q7W/bNwOQ8WifD5VSAdCRPomwkS1WULah6dChz5/vhIxDL0UfD0+0isbPq64eMHd4sA+AADYo2ZmpiIz4Bs2TzuHphT/M6I5D5gkZmb6o2Zm3qMz4Bs2zBJrpiE/KqRIV4yloXtPvnDRcb7LMTE+1ddSQVxCxcDpRMRAlGgOSzBLBoaUaBJ0lFKUjAhjdWJlX3Bvc5RoByiWQAIAAAAAAAC7nIoiFsK/v+49Nr8AV948IIbuvwWsn758Th8j63MKwHDeCb9dr/mibjP0vwD9Ar9fA4KjK/X4v1N4qL5E4Ziilwukvyhnrr5P1RmjTN/kvzIVAr9kOtG71GYhwFSeAL9ZaD6/ShHZv8lovb7eGRq+VDbVv6PAr77Snk0j8VDdv9M1Nr+WN48iRlkLwHhMxr1Oicg+pvAPwB8pNb+7ppm+q9wAwPAQH7+HMh2/pqXqvh++sr2KBm49APTiv5edKb8Hnys/wVgVwF8wDb8cY+iiE6b2v3GbC79sURe/RF79v9rTwr6F/KajDJyOv0dmO79J3++idhDuvz1iIb/aiLKgakS+v50yCL++sxU/xYDhv/lxJ7/vk/2hZB3avwSADb/XaNCilE+cvw7IB7+k/NU+AWVTv2OgUb5xmA++Y0fxvzpHE793jOYqXaAPwKbBnL4d1jQjzmDmv7hLBr9WgQe/Kii9v+ZV5L7BAii/y46RvzFoRz1x10g/apsDwPsXK7/uKog9zYYIwBcLbL5rc8O+dvXYv8E4OL+Cg0s+xaonwE1cFL9/634jGq4LwLoGgr158x+/Q7AwwDRykb4dIlQj3BPXv6dU4b4O0tW9RhLov7Jl/r4z+Ns+QIASwNGqLb8pwkqjSGKpvxh7n76sbbaiQhznv3zCBL8Axvq+sZvDv5bYub7AkNA+VsXqv0jo5b6Cs569I/bbv9I4BL9QgXMiqCGJv5dqkr61oaaiSb29vyubhL56oDG+g4sLwOQ3CL+UaA5LMEsDhpRoEnSUUpR1Lg==",
|
31 |
+
"arm_qpos": "[[-1.39992312e-01 2.38136202e-01 1.49828596e-02 1.00000000e+00\n 2.91133066e-17 2.16684304e-18]\n [ 6.48303330e-02 2.39874959e-01 1.68917123e-02 -9.98202801e-01\n -5.09729125e-02 1.60084441e-02]\n [-4.29542325e-02 1.35740325e-01 1.49828596e-02 1.00000000e+00\n 1.18528654e-17 5.16115083e-18]\n [ 3.97301391e-02 1.46335512e-01 1.49828596e-02 1.00000000e+00\n 2.59759065e-17 4.66707172e-18]\n [ 5.71459159e-02 2.30744898e-01 1.49828596e-02 1.00000000e+00\n 1.90693437e-17 1.03725239e-17]\n [-1.17353700e-01 1.42975584e-01 1.49828596e-02 1.00000000e+00\n 1.95833753e-17 -3.78758434e-18]\n [ 7.29044527e-02 2.45004416e-01 1.49828596e-02 1.00000000e+00\n 2.95188534e-17 -1.43059688e-18]\n [-7.12619603e-01 -8.24242890e-01 2.82957200e-02 -9.96428609e-01\n -7.96737298e-02 -2.72267647e-02]\n [ 8.26459694e+00 -3.51500893e+00 4.22735550e-02 -1.55518740e-01\n 8.69433861e-03 -6.50023162e-01]\n [-2.63303924e+00 2.88389301e+00 5.83851375e-02 -9.69192624e-01\n 4.08521900e-03 1.94940776e-01]\n [-4.72578369e-02 1.68860108e-01 1.49828596e-02 1.00000000e+00\n 2.20862716e-17 2.73197222e-18]\n [ 7.22422078e-02 2.07972646e-01 1.49828596e-02 1.00000000e+00\n 2.26390913e-17 1.00454747e-18]\n [ 6.64081478e+00 -4.62831497e+00 5.52630946e-02 -8.97805691e-01\n -1.31248727e-01 -1.52680397e-01]\n [-9.08336067e+00 -8.21989822e+00 7.46157542e-02 -5.79902887e-01\n 6.86599612e-01 3.19739789e-01]\n [ 4.33337879e+00 5.71194077e+01 5.57827034e+01 -3.19164783e-01\n 1.20228462e-01 7.11771607e-01]\n [ 4.76829529e+00 -8.76985836e+00 4.21687067e-02 9.94468272e-01\n -7.29493499e-02 -4.83139120e-02]\n [ 2.00919456e+01 -5.78125238e+00 2.12883681e-01 -1.44414797e-01\n -2.40256593e-01 -6.87016189e-01]\n [ 6.04598504e-03 2.47708559e-01 1.49828596e-02 1.00000000e+00\n 2.70536599e-17 1.92442577e-18]\n [-8.49054158e-01 5.04815698e-01 1.90780181e-02 -8.04683208e-01\n -5.28313816e-02 -1.76352654e-02]\n [ 8.59270841e-02 1.77510411e-01 1.49828596e-02 1.00000000e+00\n 3.05733564e-17 -2.43940611e-21]\n [ 6.34870082e-02 1.78924099e-01 1.49828596e-02 1.00000000e+00\n 2.44204975e-17 5.50492627e-19]\n [-1.36404276e-01 1.67223826e-01 1.49828596e-02 1.00000000e+00\n 2.92121315e-17 -1.93050534e-18]\n [-2.64507008e+00 1.45242643e+00 4.69631590e-02 5.96904010e-02\n -6.08212411e-01 -5.33436239e-01]\n [-4.43909876e-02 1.56189024e-01 1.49828596e-02 1.00000000e+00\n 1.92346161e-17 9.23669411e-18]\n [ 7.15564713e-02 1.29890651e-01 1.49828596e-02 1.00000000e+00\n 2.32648733e-17 7.86364957e-18]\n [-1.43249735e-01 2.34327570e-01 1.50491400e-02 9.08471823e-01\n 6.18476595e-04 1.47264951e-03]\n [ 1.14686031e+01 -1.34260101e+01 2.18658522e-01 9.82719600e-01\n -1.17180705e-01 -2.94347517e-02]\n [ 1.86388064e-02 2.14502469e-01 1.49828596e-02 1.00000000e+00\n 7.53701745e-18 3.84280891e-15]\n [-1.42669454e-01 1.19950339e-01 1.49828596e-02 1.00000000e+00\n 2.08608565e-17 -8.14111107e-19]\n [ 2.18781853e+00 7.16296136e-01 2.55983602e-02 5.62069053e-03\n 3.99783701e-01 -7.48307824e-01]\n [ 4.25122213e+00 6.90518737e-01 1.86607018e-02 7.49320626e-01\n 3.35733630e-02 -8.16837475e-02]\n [-1.09376936e+01 1.33235812e-01 8.21713433e-02 -5.87062299e-01\n 1.75013524e-02 -1.98878691e-01]\n [ 1.39709175e-01 3.92716944e-01 1.90057997e-02 9.86433983e-01\n -1.28578603e-01 7.74262846e-02]\n [-1.32535958e+00 8.51876810e-02 5.42476892e-01 7.69463718e-01\n -2.69083176e-02 -5.11347413e-01]\n [ 3.30995035e+00 -5.66494036e+00 2.17124671e-01 7.04528451e-01\n 6.16111577e-01 -2.90769786e-01]\n [-8.61711577e-02 2.48275384e-01 1.49828596e-02 1.00000000e+00\n 1.92980393e-17 -5.27676049e-18]\n [-1.33024323e+00 -1.56114376e+00 5.65023124e-01 7.39217103e-01\n -1.82101995e-01 -1.73236370e-01]\n [ 1.09217595e-02 1.18545167e-01 1.49828596e-02 1.00000000e+00\n 2.62223368e-17 -4.67292650e-18]\n [-1.72990465e+00 -1.40071702e+00 2.45824866e-02 -9.50435817e-01\n 1.81048900e-01 -2.30201587e-01]\n [-4.70998764e+00 -4.32325220e+00 3.15992907e-02 9.02328789e-01\n 3.13428156e-02 -1.54960798e-02]\n [ 7.56866559e-02 1.19547419e-01 1.49828596e-02 1.00000000e+00\n 2.88598022e-17 -8.09882818e-19]\n [-7.62394397e-03 1.66503668e-01 1.49828596e-02 1.00000000e+00\n 2.57118985e-17 -2.35662826e-18]\n [-8.50582480e-01 8.58245075e-01 2.66125016e-02 3.10409755e-01\n 7.14712858e-01 -3.91069323e-01]\n [ 5.64449043e+01 3.20382535e-01 1.41832705e+01 -8.50173831e-01\n -2.03004792e-01 2.64680892e-01]\n [-5.98844979e-03 2.23637655e-01 1.62880737e-02 -9.85888243e-01\n -5.81433345e-03 1.48275793e-01]\n [ 3.25606130e-02 2.46676147e-01 1.49828596e-02 1.00000000e+00\n 3.03172580e-17 4.48850722e-20]\n [-8.98506120e-02 1.29869238e-01 1.49828596e-02 1.00000000e+00\n 1.99953476e-17 9.72867715e-18]\n [ 2.00053945e-01 2.91877717e-01 2.43207272e-02 -9.11898971e-01\n -3.12419325e-01 2.01853380e-01]]",
|
32 |
+
"arm_qvel": "[[-1.00093546e-16 6.35776180e-17 2.32273010e-06 -7.92319119e-16\n -2.41338586e-16 7.03362064e-17]\n [ 1.80435315e-01 4.64785621e-02 -1.60248876e-01 -1.09056005e+01\n 5.72967649e-01 -1.11990757e+01]\n [-1.34101388e-17 8.00857277e-17 2.32273010e-06 -4.00681789e-16\n -9.10213558e-16 -1.27972093e-16]\n [-1.08593687e-16 5.68989287e-17 2.32273010e-06 -2.18570790e-16\n -3.38264302e-16 -1.92713081e-17]\n [ 1.00039157e-17 2.08540570e-17 2.32273010e-06 3.98694623e-16\n -7.78227508e-16 -2.99895059e-17]\n [ 1.28369539e-17 -1.36175791e-17 2.32273010e-06 1.24084450e-16\n 4.84628683e-16 1.69945299e-17]\n [-6.54195904e-17 1.70663921e-17 2.32273010e-06 -6.07604897e-16\n 3.49085597e-16 -1.39952739e-16]\n [-1.89690113e+00 -1.77763963e+00 1.50140658e-01 -1.37398415e+01\n 2.62673831e+00 3.69398022e+00]\n [ 2.06489048e+01 -9.24928570e+00 -7.11910903e-01 1.77789986e+00\n -4.83621864e+01 -5.24281921e+01]\n [-6.55216694e+00 6.41598034e+00 -3.14155221e-01 1.71351194e+00\n -1.10292883e+01 1.33201637e+01]\n [ 2.17707800e-17 -4.44089216e-17 2.32273010e-06 -1.24718698e-15\n -4.53241666e-16 -5.01704530e-17]\n [-1.51441365e-16 1.24900090e-16 2.32273010e-06 6.13917198e-16\n -4.61860914e-16 -1.76369055e-16]\n [ 1.56628714e+01 -1.21555929e+01 5.02260551e-02 3.13109088e+00\n 3.91963363e+00 -1.82705841e+01]\n [-2.27452278e+01 -2.13192768e+01 -1.56893671e+00 9.13427639e+00\n 4.58766794e+00 -3.75943065e+00]\n [ 1.11207829e+01 1.43692352e+02 1.38869705e+02 -1.89143791e+01\n -1.11976128e+02 9.66028824e+01]\n [ 1.21521301e+01 -2.16455479e+01 -3.64718765e-01 1.21136284e+01\n 9.68830109e+00 -2.67693577e+01]\n [ 4.86314049e+01 -1.50308456e+01 2.05008817e+00 1.48679161e+01\n 3.85283699e+01 -3.81374359e+01]\n [ 3.20484643e-17 9.11164756e-18 2.32273010e-06 -1.16574828e-16\n 5.13072314e-16 -3.94928086e-17]\n [-1.81543362e+00 1.03640831e+00 2.38085344e-01 -1.90514450e+01\n -3.60879779e+00 -1.37526932e+02]\n [ 1.30104261e-18 -5.78530253e-17 2.32273010e-06 -7.22714716e-16\n 1.45713860e-16 -3.96810054e-17]\n [-1.55257748e-17 8.67361751e-20 2.32273010e-06 -1.84630524e-15\n 2.39387049e-16 -1.95152487e-17]\n [ 8.76141640e-19 -1.31777722e-17 2.32273010e-06 -1.03479463e-15\n -2.57944181e-17 1.20194108e-17]\n [-5.05696440e+00 3.04281116e+00 1.01416516e+00 1.31067076e+01\n 1.20701342e+01 -1.16275272e+01]\n [-1.10703686e-16 1.15877350e-16 2.32273010e-06 -2.68638140e-16\n -1.74794394e-16 -7.74806514e-17]\n [-2.46546360e-17 2.11493605e-17 2.32273010e-06 -5.32227858e-16\n -6.90818896e-16 -3.52385931e-18]\n [-5.99468220e-03 -1.80835072e-02 1.20020076e-03 -9.72366631e-02\n 1.83866903e-01 1.53182006e+00]\n [ 2.88475113e+01 -3.33922958e+01 4.67496097e-01 -1.26920204e+01\n -1.47389424e+00 -2.90308399e+01]\n [-6.05812956e-15 6.08785740e-17 2.32273101e-06 3.34384176e-16\n -3.98033792e-13 -9.58563115e-18]\n [ 3.09648147e-17 5.11743434e-18 2.32273010e-06 -1.10440041e-15\n 9.49742111e-17 2.96469155e-16]\n [ 5.27323771e+00 1.52117682e+00 -2.08330736e-01 -9.89812851e+01\n 1.83485748e+02 1.29508484e+02]\n [ 1.01796160e+01 1.16927385e+00 -2.26860970e-01 -7.79838181e+00\n 8.03204823e+00 5.96572266e+01]\n [-2.72153988e+01 4.25829619e-14 -1.45630729e+00 -4.95970994e-01\n -1.52008915e+00 1.11367579e+01]\n [ 4.19123501e-01 5.55799484e-01 -6.51152283e-02 -2.52101021e+01\n 1.10973492e+01 1.51074800e+01]\n [-7.63831520e+00 -2.34382153e-01 1.89366794e+00 -3.10508251e-01\n -5.90068769e+00 -4.40508413e+00]\n [ 8.37993050e+00 -1.41236954e+01 -1.22791186e-01 -5.02374344e+01\n 2.28744507e+01 -1.76167545e+01]\n [ 2.89698834e-17 -1.01741535e-16 2.32273010e-06 7.87115028e-17\n -7.96547401e-16 3.33385484e-17]\n [-8.46328354e+00 -9.27808475e+00 3.46276665e+00 -1.92002273e+00\n -2.41155291e+00 -8.27410984e+00]\n [ 3.23525922e-17 3.18321764e-17 2.32273010e-06 -3.37288546e-16\n 2.92891367e-16 -1.03837385e-16]\n [-3.69977665e+00 -3.76147771e+00 -4.30695713e-01 1.00006008e+01\n -9.86017609e+00 -3.98306966e+00]\n [-1.14884977e+01 -1.11645203e+01 -3.60794842e-01 5.11708021e-01\n 5.21423519e-01 2.10098958e+00]\n [-1.18828556e-17 -7.10369277e-17 2.32273032e-06 -4.84628677e-17\n 2.07512140e-16 -1.11968743e-16]\n [ 5.75089181e-17 8.57120382e-17 2.32273010e-06 -1.44581631e-15\n 1.08687694e-16 4.31556471e-17]\n [-1.30401921e+00 1.19200635e+00 1.71741381e-01 4.72969818e+00\n -2.12908077e+00 -1.41930366e+00]\n [ 1.42861023e+02 2.46714666e-01 3.38206367e+01 -4.17444000e+01\n 5.44270172e+01 8.37653351e+01]\n [-2.49261960e-01 -3.42264846e-02 1.85043633e-01 1.51534349e-01\n -1.55450878e+01 3.76730829e-01]\n [-2.34187669e-17 4.51028087e-18 2.32273010e-06 -9.38358240e-16\n -2.43940608e-18 6.59452803e-17]\n [-2.71484217e-17 -2.41126557e-17 2.32273010e-06 -8.15574779e-16\n -3.69163461e-17 -2.43452727e-16]\n [-2.02620044e-01 -2.36150503e-01 1.73041508e-01 1.31776934e+01\n -6.16435051e+00 6.13341188e+00]]",
|
33 |
+
"cube_pos": "[[ 3.75709198e-18 -1.49811053e+00 -7.11882472e-01]\n [ 2.71410942e-02 -1.86346817e+00 -3.11859280e-01]\n [ 8.63602698e-18 -2.16332507e+00 -5.38550377e-01]\n [-6.76772583e-18 -1.90781951e+00 -5.11672974e-01]\n [-1.40960560e-17 -1.94498193e+00 -3.29043001e-01]\n [-4.14381918e-18 -1.28160369e+00 -3.40630770e-01]\n [-8.33931647e-18 -1.78806448e+00 -5.08135915e-01]\n [-6.38513453e-03 -2.52190113e+00 -5.02415895e-01]\n [-7.43779719e-01 -1.69584012e+00 -3.69940072e-01]\n [-1.50489300e-01 -1.66572046e+00 -3.43266577e-01]\n [ 1.11467038e-17 -1.72903264e+00 -7.11758792e-01]\n [ 3.88190816e-18 -2.17732382e+00 -9.68255401e-02]\n [ 3.91672552e-01 -2.24906301e+00 -7.07658708e-01]\n [-3.00100178e-01 -2.01346850e+00 -6.21352196e-01]\n [-6.14052236e-01 -4.58295047e-01 -8.72766897e-02]\n [ 5.81117049e-02 -1.77307129e+00 -6.62560880e-01]\n [ 6.70395315e-01 -2.33354211e+00 -5.51519334e-01]\n [-6.29886621e-18 -1.92694318e+00 -5.45340598e-01]\n [-5.91086149e-01 -1.97943926e+00 -3.80522549e-01]\n [-1.81047022e-17 -1.11413717e+00 -7.32029378e-01]\n [-6.50174922e-18 -1.85987735e+00 -6.30405247e-01]\n [-3.02449337e-19 -1.48646283e+00 -5.32022297e-01]\n [ 5.84773898e-01 -1.76174223e+00 -6.54082835e-01]\n [-1.71831045e-18 -1.70402193e+00 -5.52734613e-01]\n [-5.64895165e-18 -1.22117853e+00 -5.30396342e-01]\n [ 4.17943120e-01 -8.25759947e-01 -2.04713389e-01]\n [-1.40229955e-01 -1.88499105e+00 -5.75305581e-01]\n [ 4.09536744e-13 -2.24416280e+00 -3.06164920e-01]\n [ 9.80315980e-18 -1.79982924e+00 -5.24592876e-01]\n [-5.29317260e-01 -1.47778821e+00 -4.45967853e-01]\n [-6.56292021e-01 -1.13717020e+00 4.86833490e-02]\n [ 7.84537375e-01 -2.05636072e+00 -6.68334663e-01]\n [ 6.64881319e-02 -2.13322759e+00 -2.30511054e-01]\n [-3.81739944e-01 -1.69499087e+00 -7.19615996e-01]\n [ 1.98743850e-01 -2.61979795e+00 -5.79533398e-01]\n [ 1.38192358e-17 -2.18250132e+00 -6.34893924e-02]\n [-6.24808848e-01 -2.76075816e+00 -2.84074426e-01]\n [ 1.14997668e-17 -1.68029356e+00 -4.40098971e-01]\n [-1.04404554e-01 -1.81305766e+00 -4.96869624e-01]\n [ 4.29627985e-01 -2.28907776e+00 -6.78387702e-01]\n [-1.09915570e-17 -1.32331181e+00 -3.11486006e-01]\n [-4.94473185e-18 -1.80554986e+00 -5.18592596e-01]\n [-4.89791870e-01 -1.52818882e+00 -3.62980545e-01]\n [ 4.07354355e-01 -1.83414721e+00 -4.49037790e-01]\n [-7.74908215e-02 -1.71844900e+00 -5.16492009e-01]\n [ 3.30010985e-18 -1.07133961e+00 -2.85969466e-01]\n [-4.51656041e-18 -1.48233902e+00 -2.58996338e-01]\n [-1.73463732e-01 -2.18039012e+00 -5.32102823e-01]]"
|
34 |
},
|
35 |
+
"_episode_num": 576,
|
36 |
"use_sde": true,
|
37 |
"sde_sample_freq": -1,
|
38 |
+
"_current_progress_remaining": 0.9875248,
|
39 |
"_stats_window_size": 100,
|
40 |
"ep_info_buffer": {
|
41 |
":type:": "<class 'collections.deque'>",
|
42 |
+
":serialized:": "gAWV4AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwFMN4+bExZeMAWyUS8iMAXSUR0BFxXwb2lEadX2UKGgGR8BYPJQLux8laAdLyGgIR0BFtxwqAjIJdX2UKGgGR8BYPJQLux8laAdLyGgIR0BFqQQL/jsEdX2UKGgGR8BLxAnDziCKaAdLyGgIR0BFmuF6AvtddX2UKGgGR8BYPJQLux8laAdLyGgIR0BKaGQjlgc+dX2UKGgGR8BX6XocJdB0aAdLyGgIR0BKWfBN21UmdX2UKGgGR8BYPJQP7N0OaAdLyGgIR0BKS7uUliSadX2UKGgGR8BYPJQLux8laAdLyGgIR0BKPZX+2mYTdX2UKGgGR8BYPJQLux8laAdLyGgIR0BKL2LxZuAJdX2UKGgGR8BYPJQLux8laAdLyGgIR0BKIS7f51vEdX2UKGgGR8BYPJQLux8laAdLyGgIR0BKEwIMSbpedX2UKGgGR8BYOqtDD0lJaAdLyGgIR0BKBNtQ9A5adX2UKGgGR8BG7FspG4I9aAdLyGgIR0BJ9ri2lVLjdX2UKGgGR8BW4NK7I1cdaAdLyGgIR0BJ6JJPIn0DdX2UKGgGR8BYPJQLux8laAdLyGgIR0BJ2l5GBnSOdX2UKGgGR8BYPJQLux8laAdLyGgIR0BJzDWkJrtWdX2UKGgGR8BOgsXSBshxaAdLyGgIR0BJvgqur6tUdX2UKGgGR8Av3BOYYzi0aAdLyGgIR0BJryvTw2ETdX2UKGgGR0Cg/N127nPnaAdLyGgIR0BJoG5+YtxudX2UKGgGR8BP/b5Ec81XaAdLyGgIR0BJjskyDZlGdX2UKGgGR8AusNT987ZGaAdLyGgIR0BJgJb2USqVdX2UKGgGR8BYPJQLux8laAdLyGgIR0BJcneBQN1AdX2UKGgGR8BX5T8tPHktaAdLyGgIR0BJZFXq7iAEdX2UKGgGR8BYPJQLux8laAdLyGgIR0BJVizkZJkHdX2UKGgGR8BYPJQLux8laAdLyGgIR0BJSA1ejVQRdX2UKGgGR8BYPJQLux8laAdLyGgIR0BJOcqOLiuMdX2UKGgGR8BACTg2qDK6aAdLyGgIR0BJK5mAbyYpdX2UKGgGR8BYPJQLux8laAdLyGgIR0BJHX0XgtOEdX2UKGgGR8BYPJQLux8laAdLyGgIR0BJD1SOzY29dX2UKGgGR8BYLkDU3GXHaAdLyGgIR0BJATHbRF7VdX2UKGgGR8BNTTj3mFJyaAdLyGgIR0BI8w+2VmjCdX2UKGgGR8BYOEqYqoZRaAdLyGgIR0BI5OrZJ04jdX2UKGgGR8BYPJQLux8laAdLyGgIR0BI1p9y925hdX2UKGgGR8BXcK+Jxeb/aAdLyGgIR0BIyIs7MgU2dX2UKGgGR8BVeJw0fozOaAdLyGgIR0BIumQjlgc+dX2UKGgGR8BN76WgOBlMaAdLyGgIR0BIrEIw/PgOdX2UKGgGR8BX2F0PpY9xaAdLyGgIR0BImiDVYp2EdX2UKGgGR8BYPJQLux8laAdLyGgIR0BIi/dAPd2xdX2UKGgGR8BMAAv114gSaAdLyGgIR0BIfdAxBVuKdX2UKGgGR8BYPJQLux8laAdLyGgIR0BIb7UwztTldX2UKGgGR8BYPJQLux8laAdLyGgIR0BIYXdbgTAWdX2UKGgGR8BYPJQLux8laAdLyGgIR0BIU0FB6a9cdX2UKGgGR8BXaBhDw6QvaAdLyGgIR0BIRR0U47zTdX2UKGgGR8BVO85fdAPeaAdLyGgIR0BINvva11GLdX2UKGgGR8BYPJQLux8laAdLyGgIR0BIKNwzch1UdX2UKGgGR8BYPJQLux8laAdLyGgIR0BIGsIVuaWpdX2UKGgGR8BXuf6GgzxgaAdLyGgIR0BIDJrULDyfdX2UKGgGR0CaTI6GgzxgaAdLyGgIR0BH/nbItDlYdX2UKGgGR8BLtWo3rD64aAdLyGgIR0BH8DFqBVdYdX2UKGgGR8BYPJQLux8laAdLyGgIR0BH4dGZuyeJdX2UKGgGR8BYPJQLux8laAdLyGgIR0BH07nX/YJ3dX2UKGgGR8BWA0Y0l7dBaAdLyGgIR0BHxZfD1oQGdX2UKGgGR8BYPJQLux8laAdLyGgIR0BMBafapPykdX2UKGgGR8BX5o2OyVv/aAdLyGgIR0BL9zGPxQSBdX2UKGgGR8BYPJQLux8laAdLyGgIR0BL6PuPV/c4dX2UKGgGR8BYPJQLux8laAdLyGgIR0BL2tR3u/lAdX2UKGgGR8BYPJQLux8laAdLyGgIR0BLzKJuVHFxdX2UKGgGR8BYPJQLux8laAdLyGgIR0BLvm0mdAgQdX2UKGgGR8BYPJQLux8laAdLyGgIR0BLsD8tPHktdX2UKGgGR8A8n4tpVS4waAdLyGgIR0BLohcZ9/jLdX2UKGgGR8BArl3yI55raAdLyGgIR0BLk/NJOFg2dX2UKGgGR8BViCd4FA3UaAdLyGgIR0BLhcyN4qwydX2UKGgGR8BYPJQLux8laAdLyGgIR0BLd5c9nscAdX2UKGgGR8BYPJQLux8laAdLyGgIR0BLaWweNkvsdX2UKGgGR8BVUq8L8aXKaAdLyGgIR0BLWz/IbOu8dX2UKGgGR8BUgwIUrTYvaAdLyGgIR0BLTF/H5rP/dX2UKGgGR0C2dF33Hq/uaAdLyGgIR0BLPaEi+tbLdX2UKGgGR8A7M2WIGhVVaAdLyGgIR0BLK/qX4TK1dX2UKGgGR8BQ9sERraduaAdLyGgIR0BLHccuJ1q4dX2UKGgGR8BYPJQLux8laAdLyGgIR0BLD6a9bor4dX2UKGgGR8BXoZaePJaJaAdLyGgIR0BLAYQrc0tRdX2UKGgGR8BYPJQLux8laAdLyGgIR0BK81oQFs55dX2UKGgGR8BYPJQLux8laAdLyGgIR0BK5TmfXf65dX2UKGgGR8BYPJQLux8laAdLyGgIR0BK1vWxyGSIdX2UKGgGR8BWiHsTnJT3aAdLyGgIR0BKyMOwxFiKdX2UKGgGR8BYPJQLux8laAdLyGgIR0BKuqYqoZQ6dX2UKGgGR8BYPJQLux8laAdLyGgIR0BKrHx8UmD2dX2UKGgGR8BYNxY7q6e5aAdLyGgIR0BKnliSaEzwdX2UKGgGR8BTQS/fwZwXaAdLyGgIR0BKkDVH4GlidX2UKGgGR8BYPE7GNrCWaAdLyGgIR0BKgg93bEgodX2UKGgGR8BYPJQLux8laAdLyGgIR0BKc8LronrqdX2UKGgGR8BXpWD6Fds0aAdLyGgIR0BKZa2F36hydX2UKGgGR8BVSn3g1m8NaAdLyGgIR0BKV4V6/qPfdX2UKGgGR8BVKfo7muDBaAdLyGgIR0BKSWJaaCtjdX2UKGgGR8BX3EtVaOghaAdLyGgIR0BKNz4cm0E6dX2UKGgGR8BYPJQLux8laAdLyGgIR0BKKRNRFZxJdX2UKGgGR8BVt1XeWOZLaAdLyGgIR0BKGuryUcGUdX2UKGgGR8BYPJQLux8laAdLyGgIR0BKDM+V1Oj7dX2UKGgGR8BYPJQLux8laAdLyGgIR0BJ/pBgNPP+dX2UKGgGR8BYPJQLux8laAdLyGgIR0BJ8FkH2RJVdX2UKGgGR8BXP5vLowEhaAdLyGgIR0BJ4jO1OTJRdX2UKGgGR8BVrlxn3+MqaAdLyGgIR0BJ1BGH58BudX2UKGgGR8BYPJQLux8laAdLyGgIR0BJxfChvitJdX2UKGgGR8BYPJQLux8laAdLyGgIR0BJt9U0elsQdX2UKGgGR8BXrVEVnEl3aAdLyGgIR0BJqay8jAzpdX2UKGgGR0CX1ZPZqVQiaAdLyGgIR0BJm4eDFqBVdX2UKGgGR8BX3ivX9R77aAdLyGgIR0BJjUEHMUypdX2UKGgGR8BYPJQLux8laAdLyGgIR0BJfuBDohZAdX2UKGgGR8BYPJQLux8laAdLyGgIR0BJcMdDIBBBdX2UKGgGR8BXbGTX8O0+aAdLyGgIR0BJYqQRwqAjdWUu"
|
43 |
},
|
44 |
"ep_success_buffer": {
|
45 |
":type:": "<class 'collections.deque'>",
|
46 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
47 |
},
|
48 |
+
"_n_updates": 2597,
|
49 |
"observation_space": {
|
50 |
":type:": "<class 'gymnasium.spaces.dict.Dict'>",
|
51 |
":serialized:": "gAWVzAMAAAAAAACMFWd5bW5hc2l1bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojAhhcm1fcXBvc5SMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBgAAAAAAAAABAQEBAQGUaBOMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLBoWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBwolgYAAAAAAAAAAQEBAQEBlGggSwaFlGgkdJRSlIwGX3NoYXBllEsGhZSMA2xvd5RoHCiWGAAAAAAAAADbD0nA2w9JwNsPScDbD0nA2w9JwNsPScCUaBZLBoWUaCR0lFKUjARoaWdolGgcKJYYAAAAAAAAANsPSUDbD0lA2w9JQNsPSUDbD0lA2w9JQJRoFksGhZRoJHSUUpSMCGxvd19yZXBylIwKLTMuMTQxNTkyN5SMCWhpZ2hfcmVwcpSMCTMuMTQxNTkyN5SMCl9ucF9yYW5kb22UTnVijAhhcm1fcXZlbJRoDSmBlH2UKGgQaBZoGWgcKJYGAAAAAAAAAAEBAQEBAZRoIEsGhZRoJHSUUpRoJ2gcKJYGAAAAAAAAAAEBAQEBAZRoIEsGhZRoJHSUUpRoLEsGhZRoLmgcKJYYAAAAAAAAAAAAIMEAACDBAAAgwQAAIMEAACDBAAAgwZRoFksGhZRoJHSUUpRoM2gcKJYYAAAAAAAAAAAAIEEAACBBAAAgQQAAIEEAACBBAAAgQZRoFksGhZRoJHSUUpRoOIwFLTEwLjCUaDqMBDEwLjCUaDxOdWKMCGN1YmVfcG9zlGgNKYGUfZQoaBBoFmgZaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgnaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgsSwOFlGguaBwolgwAAAAAAAAAAAAgwQAAIMEAACDBlGgWSwOFlGgkdJRSlGgzaBwolgwAAAAAAAAAAAAgQQAAIEEAACBBlGgWSwOFlGgkdJRSlGg4jAUtMTAuMJRoOowEMTAuMJRoPE51YnVoLE5oEE5oPE51Yi4=",
|
|
|
83 |
"__module__": "stable_baselines3.common.buffers",
|
84 |
"__annotations__": "{'observation_space': <class 'gymnasium.spaces.dict.Dict'>, 'obs_shape': typing.Dict[str, typing.Tuple[int, ...]], 'observations': typing.Dict[str, numpy.ndarray], 'next_observations': typing.Dict[str, numpy.ndarray]}",
|
85 |
"__doc__": "\n Dict Replay buffer used in off-policy algorithms like SAC/TD3.\n Extends the ReplayBuffer to use dictionary observations\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n Disabled for now (see https://github.com/DLR-RM/stable-baselines3/pull/243#discussion_r531535702)\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
|
86 |
+
"__init__": "<function DictReplayBuffer.__init__ at 0x7f4fa7fa9f30>",
|
87 |
+
"add": "<function DictReplayBuffer.add at 0x7f4fa7fa9fc0>",
|
88 |
+
"sample": "<function DictReplayBuffer.sample at 0x7f4fa7faa050>",
|
89 |
+
"_get_samples": "<function DictReplayBuffer._get_samples at 0x7f4fa7faa0e0>",
|
90 |
"__abstractmethods__": "frozenset()",
|
91 |
+
"_abc_impl": "<_abc._abc_data object at 0x7f4fa81a7740>"
|
92 |
},
|
93 |
"replay_buffer_kwargs": {},
|
94 |
"train_freq": {
|
tqc-LiftCube-v0/ent_coef_optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1940
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b729f55979f95a3e059e89983e722df7e5f98a9eaeb7cd23839e2f4be6cd8377
|
3 |
size 1940
|
tqc-LiftCube-v0/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1548985
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fa397032689675c79f2497cb4ef994eefdf607d40f7902d86370dc3e60bd683
|
3 |
size 1548985
|
tqc-LiftCube-v0/pytorch_variables.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1180
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44a9c62c012cbe1e84a392152bb67776d2536710ff79bed99d8f9e1146b7441b
|
3 |
size 1180
|
train_eval_metrics.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52c839271da2475b755417cfef0947a4f1bba0dc98caf5757dc0ef4a7b17eb03
|
3 |
+
size 145046
|