Commit
·
f7c6333
1
Parent(s):
eb134e4
Initial commit
Browse files- README.md +1 -1
- replay.mp4 +2 -2
- results.json +1 -1
- tqc-ReachCube-v0.zip +2 -2
- tqc-ReachCube-v0/actor.optimizer.pth +1 -1
- tqc-ReachCube-v0/critic.optimizer.pth +1 -1
- tqc-ReachCube-v0/data +16 -16
- tqc-ReachCube-v0/ent_coef_optimizer.pth +1 -1
- tqc-ReachCube-v0/policy.pth +1 -1
- tqc-ReachCube-v0/pytorch_variables.pth +1 -1
- train_eval_metrics.zip +2 -2
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
type: ReachCube-v0
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
-
value: -
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
|
|
16 |
type: ReachCube-v0
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
+
value: -62.33 +/- 29.66
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49a09daac0230127a0e8efd9dad29f0b7ab429b0e9a24502ef238788f0cd0967
|
3 |
+
size 823603
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward": -
|
|
|
1 |
+
{"mean_reward": -62.3253778, "std_reward": 29.662999394691855, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-06-13T15:34:07.710095"}
|
tqc-ReachCube-v0.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d27ffe604b4d41b1f591f1265afaaa42cd86ce308add044172d684c484c9582
|
3 |
+
size 3417950
|
tqc-ReachCube-v0/actor.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 589975
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08b303fcc966d40e20f7131fea0b9b388cf1589f757c480553d1bcefbcce3b31
|
3 |
size 589975
|
tqc-ReachCube-v0/critic.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1255594
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19f9d2fa2fdc19a9053facd74c5e95ddd9d5a2a6a7604cf97a6606706b4a70d2
|
3 |
size 1255594
|
tqc-ReachCube-v0/data
CHANGED
@@ -4,15 +4,15 @@
|
|
4 |
":serialized:": "gAWVMQAAAAAAAACMGHNiM19jb250cmliLnRxYy5wb2xpY2llc5SMEE11bHRpSW5wdXRQb2xpY3mUk5Qu",
|
5 |
"__module__": "sb3_contrib.tqc.policies",
|
6 |
"__doc__": "\n Policy class (with both actor and critic) for TQC.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param use_expln: Use ``expln()`` function instead of ``exp()`` when using gSDE to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param clip_mean: Clip the mean output when using gSDE to avoid numerical instability.\n :param features_extractor_class: Features extractor to use.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_quantiles: Number of quantiles for the critic.\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ",
|
7 |
-
"__init__": "<function MultiInputPolicy.__init__ at
|
8 |
"__abstractmethods__": "frozenset()",
|
9 |
-
"_abc_impl": "<_abc._abc_data object at
|
10 |
},
|
11 |
"verbose": 1,
|
12 |
"policy_kwargs": {
|
13 |
"use_sde": true
|
14 |
},
|
15 |
-
"num_timesteps":
|
16 |
"_total_timesteps": 10000000,
|
17 |
"_num_timesteps_at_start": 0,
|
18 |
"seed": 0,
|
@@ -27,25 +27,25 @@
|
|
27 |
},
|
28 |
"_last_original_obs": {
|
29 |
":type:": "<class 'collections.OrderedDict'>",
|
30 |
-
":serialized:": "
|
31 |
-
"arm_qpos": "[[-0.
|
32 |
-
"arm_qvel": "[[-
|
33 |
-
"cube_pos": "[[ 0.
|
34 |
},
|
35 |
-
"_episode_num":
|
36 |
"use_sde": true,
|
37 |
"sde_sample_freq": -1,
|
38 |
-
"_current_progress_remaining": 0.
|
39 |
"_stats_window_size": 100,
|
40 |
"ep_info_buffer": {
|
41 |
":type:": "<class 'collections.deque'>",
|
42 |
-
":serialized:": "
|
43 |
},
|
44 |
"ep_success_buffer": {
|
45 |
":type:": "<class 'collections.deque'>",
|
46 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
47 |
},
|
48 |
-
"_n_updates":
|
49 |
"observation_space": {
|
50 |
":type:": "<class 'gymnasium.spaces.dict.Dict'>",
|
51 |
":serialized:": "gAWVzAMAAAAAAACMFWd5bW5hc2l1bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojAhhcm1fcXBvc5SMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBgAAAAAAAAABAQEBAQGUaBOMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLBoWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBwolgYAAAAAAAAAAQEBAQEBlGggSwaFlGgkdJRSlIwGX3NoYXBllEsGhZSMA2xvd5RoHCiWGAAAAAAAAADbD0nA2w9JwNsPScDbD0nA2w9JwNsPScCUaBZLBoWUaCR0lFKUjARoaWdolGgcKJYYAAAAAAAAANsPSUDbD0lA2w9JQNsPSUDbD0lA2w9JQJRoFksGhZRoJHSUUpSMCGxvd19yZXBylIwKLTMuMTQxNTkyN5SMCWhpZ2hfcmVwcpSMCTMuMTQxNTkyN5SMCl9ucF9yYW5kb22UTnVijAhhcm1fcXZlbJRoDSmBlH2UKGgQaBZoGWgcKJYGAAAAAAAAAAEBAQEBAZRoIEsGhZRoJHSUUpRoJ2gcKJYGAAAAAAAAAAEBAQEBAZRoIEsGhZRoJHSUUpRoLEsGhZRoLmgcKJYYAAAAAAAAAAAAIMEAACDBAAAgwQAAIMEAACDBAAAgwZRoFksGhZRoJHSUUpRoM2gcKJYYAAAAAAAAAAAAIEEAACBBAAAgQQAAIEEAACBBAAAgQZRoFksGhZRoJHSUUpRoOIwFLTEwLjCUaDqMBDEwLjCUaDxOdWKMCGN1YmVfcG9zlGgNKYGUfZQoaBBoFmgZaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgnaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgsSwOFlGguaBwolgwAAAAAAAAAAAAgwQAAIMEAACDBlGgWSwOFlGgkdJRSlGgzaBwolgwAAAAAAAAAAAAgQQAAIEEAACBBlGgWSwOFlGgkdJRSlGg4jAUtMTAuMJRoOowEMTAuMJRoPE51YnVoLE5oEE5oPE51Yi4=",
|
@@ -83,12 +83,12 @@
|
|
83 |
"__module__": "stable_baselines3.common.buffers",
|
84 |
"__annotations__": "{'observation_space': <class 'gymnasium.spaces.dict.Dict'>, 'obs_shape': typing.Dict[str, typing.Tuple[int, ...]], 'observations': typing.Dict[str, numpy.ndarray], 'next_observations': typing.Dict[str, numpy.ndarray]}",
|
85 |
"__doc__": "\n Dict Replay buffer used in off-policy algorithms like SAC/TD3.\n Extends the ReplayBuffer to use dictionary observations\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n Disabled for now (see https://github.com/DLR-RM/stable-baselines3/pull/243#discussion_r531535702)\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
|
86 |
-
"__init__": "<function DictReplayBuffer.__init__ at
|
87 |
-
"add": "<function DictReplayBuffer.add at
|
88 |
-
"sample": "<function DictReplayBuffer.sample at
|
89 |
-
"_get_samples": "<function DictReplayBuffer._get_samples at
|
90 |
"__abstractmethods__": "frozenset()",
|
91 |
-
"_abc_impl": "<_abc._abc_data object at
|
92 |
},
|
93 |
"replay_buffer_kwargs": {},
|
94 |
"train_freq": {
|
|
|
4 |
":serialized:": "gAWVMQAAAAAAAACMGHNiM19jb250cmliLnRxYy5wb2xpY2llc5SMEE11bHRpSW5wdXRQb2xpY3mUk5Qu",
|
5 |
"__module__": "sb3_contrib.tqc.policies",
|
6 |
"__doc__": "\n Policy class (with both actor and critic) for TQC.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param use_expln: Use ``expln()`` function instead of ``exp()`` when using gSDE to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param clip_mean: Clip the mean output when using gSDE to avoid numerical instability.\n :param features_extractor_class: Features extractor to use.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_quantiles: Number of quantiles for the critic.\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ",
|
7 |
+
"__init__": "<function MultiInputPolicy.__init__ at 0x7f3b3e53b7f0>",
|
8 |
"__abstractmethods__": "frozenset()",
|
9 |
+
"_abc_impl": "<_abc._abc_data object at 0x7f3b3e53ff80>"
|
10 |
},
|
11 |
"verbose": 1,
|
12 |
"policy_kwargs": {
|
13 |
"use_sde": true
|
14 |
},
|
15 |
+
"num_timesteps": 899712,
|
16 |
"_total_timesteps": 10000000,
|
17 |
"_num_timesteps_at_start": 0,
|
18 |
"seed": 0,
|
|
|
27 |
},
|
28 |
"_last_original_obs": {
|
29 |
":type:": "<class 'collections.OrderedDict'>",
|
30 |
+
":serialized:": "gAWVrwQAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojAhhcm1fcXBvc5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJaAAQAAAAAAAMQecb05kUs/eiyUvxGzyD4UagY+JkiFv09DpD+2V7U+/gylv2tQAb+bRtq+OMaGvhroDr+9mDm9moy4voas0D9EA1e+VR2rv6RhTj9ZsUO+/TnjvhRe5r61M6k/3njLvRPRnD4/NSk/BA+ev1c1ub4tvYA/VFX+vucZdb0OleY+8k9uv4Gb0D7iCgi/BryYv8E0+L6whkY+lmEDv68NnT+5E2Y/2zeevzr+1T+FoYG/wX1/P2TymT6edvy9nKCKvF+Yuj9md+W+/NSUvpUWZL6+BE2+bHjvvdVkvz+MrVe/AHSqPgsbP76iU62/B2HNvldCGb9JDh8+MUYhv34P5T+VKq2+ME/Nv7QKxD+KWL++1OEKv/csAb/JO5g9zx+dv6GQLT+u6Yq/8vzXPvvlq79fEyM/GYtXvvwO/z4hTSU/Q2a6v0Fn2r4NzCI/WO0qv20Jvj/ttxm+8PYbv0PRNr7NNgS/RhUKvxphEj++mDQ/A1+6v1c1ub50Kx0/gIAbv5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsGhpSMAUOUdJRSlIwIYXJtX3F2ZWyUaAcoloABAAAAAAAAOjIbwHeLbsC0b/+/JwK5wANqoMAIjp9ATLkevxx/H79ie7G/AsrTwNiensBlvJ1Aq2h6v358j7+pGrY/OcJDQPyWm8AS/J/ALlLxPyRJosDgnYy8kHd+QLS4n0Bv3p3AJfkiQBUq7j9HlAJBQmD2wJvEm8AdUpPA7aDhv4w8+z/T8Zg/8lBTQOINoMD425/A2ygEPxg0wL9VcHBAMDkvP/UmkcCVq5rAXAGRP8IDl7/260lALHo9wIjslkD865XAssYswHMDNkDKripAhVnKwPPhs8Bcl4FA7DWHP9Z0qMBkFTRAiLqPQHnLn8CTXpxAWO80PeZg+j9zEFu+T1J7QPaonMCHKyDAjsJiQBO/iT93sSnASFwfwPNnn0CzlpjANyODv5BQFb8SpQnAeaSZQIL+n8C3AKFAM6Lyv2VDQ8DirgLAhXK4wMCsssBXG6BAfq3cP9ZAo79PEbq/J4atwLvTn8BDi6BA31TnPsYFPsBiHdW/cOS/wJtNrMCrLqFAlGgOSxBLBoaUaBJ0lFKUjAhjdWJlX3Bvc5RoByiWwAAAAAAAAAC218c9+4MgPfR6dTzeTyu+/8jYvPR6dTwGDiA+JZ3+PfR6dTzG+wG+QRfUPfF5dTz9Fpu8MClmPfR6dTxsCK49kDTcPdt0dTwdwxA+9y8VPuArbjwgARC/n3HEvZ91nzzKCua+Cwq9Pax6dTzwTG6+QKiuuvR6dTzP7y0+0xegPfR6dTxP0kO/djqFPeSggDwKlNa9fpKuPvR6dTw6hTm9Ron6PPR6dTwgroa+lnnGvOouaDyFZSy91plou/J6dTyUaA5LEEsDhpRoEnSUUpR1Lg==",
|
31 |
+
"arm_qpos": "[[-0.05886723 0.7951847 -1.1576073 0.39199117 0.13126403 -1.0412643 ]\n [ 1.2833041 0.3541848 -1.289459 -0.50513333 -0.42631993 -0.26323104]\n [-0.5582291 -0.04531168 -0.3604477 1.630265 -0.2099734 -1.3368326 ]\n [ 0.8061774 -0.19110622 -0.4438018 -0.4499365 1.3218905 -0.09935163]\n [ 0.3062826 0.6609687 -1.2348332 -0.36173508 1.0057732 -0.49674475]\n [-0.05983916 0.45035595 -0.93090737 0.4074364 -0.53141606 -1.193238 ]\n [-0.48477748 0.19387317 -0.5132078 1.2269801 0.89873844 -1.2360796 ]\n [ 1.6718209 -1.0127417 0.9980126 0.30067742 -0.12327312 -0.01692229]\n [ 1.457775 -0.44817656 -0.29068744 -0.2227424 -0.2002134 -0.11692891]\n [ 1.4952646 -0.84249187 0.33291626 -0.1866266 -1.3541148 -0.40113088]\n [-0.5986685 0.15532793 -0.6299773 1.7895353 -0.3382155 -1.6039791 ]\n [ 1.5315766 -0.37372237 -0.54250836 -0.50459236 0.07433278 -1.2275332 ]\n [ 0.6779881 -1.0852563 0.4218517 -1.342956 0.6370143 -0.21049155]\n [ 0.4981612 0.64570814 -1.4562458 -0.426569 0.63592607 -0.6676841 ]\n [ 1.4846627 -0.15011568 -0.6092367 -0.17853265 -0.5164612 -0.5393871 ]\n [ 0.57179415 0.70545566 -1.4560245 -0.36173508 0.6139443 -0.6074295 ]]",
|
32 |
+
"arm_qvel": "[[-2.4249406 -3.7272623 -1.9955964 -5.7815127 -5.012941 4.986088 ]\n [-0.6200149 -0.6230333 -1.3865778 -6.618409 -4.95689 4.9292474 ]\n [-0.9781596 -1.1209867 1.4226886 3.0587294 -4.8621807 -4.9995203 ]\n [ 1.8853204 -5.0714283 -0.01716512 3.9760475 4.991297 -4.9334025 ]\n [ 2.5464566 1.8606592 8.161201 -7.69925 -4.8677497 -4.6037736 ]\n [-1.7627236 1.9627852 1.1948799 3.3018155 -5.0016947 -4.9956017 ]\n [ 0.5162484 -1.5015898 3.7568562 0.68446636 -4.5360055 -4.833445 ]\n [ 1.132854 -1.1798022 3.155027 -2.9605818 4.7163734 -4.6850567 ]\n [-2.6996274 2.8439605 2.6669183 -6.3234277 -5.6213317 4.0497265 ]\n [ 1.0563331 -5.264262 2.8138056 4.49152 -4.993588 4.8865447 ]\n [ 0.04417357 1.9560821 -0.21392994 3.9268987 -4.895625 -2.5026567 ]\n [ 3.5431247 1.0761436 -2.6514566 -2.4900074 4.981439 -4.768396 ]\n [-1.0245122 -0.58326054 -2.1507 4.801327 -4.999818 5.0313373 ]\n [-1.8955749 -3.0509884 -2.041924 -5.7639794 -5.5835876 5.0033374 ]\n [ 1.7240446 -1.2754161 -1.4536532 -5.422626 -4.994596 5.0169997 ]\n [ 0.4518194 -2.9691024 -1.6649592 -5.9966354 -5.3844733 5.036947 ]]",
|
33 |
+
"cube_pos": "[[ 0.0975794 0.03918837 0.01498293]\n [-0.16729686 -0.02646303 0.01498293]\n [ 0.1563035 0.12432317 0.01498293]\n [-0.126937 0.10355998 0.01498269]\n [-0.01893186 0.05619162 0.01498293]\n [ 0.084977 0.10752213 0.01498147]\n [ 0.1413693 0.14569078 0.01453683]\n [-0.56251717 -0.09591984 0.01946527]\n [-0.44930106 0.09230431 0.01498286]\n [-0.23271537 -0.00133253 0.01498293]\n [ 0.16986011 0.07817044 0.01498293]\n [-0.7649278 0.06505291 0.01570172]\n [-0.10477455 0.3409614 0.01498293]\n [-0.04529307 0.03058304 0.01498293]\n [-0.26304722 -0.0242279 0.01417134]\n [-0.042089 -0.00354921 0.01498293]]"
|
34 |
},
|
35 |
+
"_episode_num": 1792,
|
36 |
"use_sde": true,
|
37 |
"sde_sample_freq": -1,
|
38 |
+
"_current_progress_remaining": 0.9100304,
|
39 |
"_stats_window_size": 100,
|
40 |
"ep_info_buffer": {
|
41 |
":type:": "<class 'collections.deque'>",
|
42 |
+
":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwDtyUnogV46MAWyUTfQBjAF0lEdAkMoeHJtBOnV9lChoBkfAQSetbLU1AWgHTfQBaAhHQJDJqv8qFyt1fZQoaAZHwEr+W3Sa3JBoB030AWgIR0CQyTd5Y5ktdX2UKGgGR8BGHKTB68g7aAdN9AFoCEdAkMikFbFCLXV9lChoBkfAcFS6C17Y02gHTfQBaAhHQJEA0+mm+Cd1fZQoaAZHwEiGQiiZfD1oB030AWgIR0CRAFuBtk4FdX2UKGgGR8BGoE/8l5WzaAdN9AFoCEdAkP/nBk7OmnV9lChoBkfARjQrvsqrimgHTfQBaAhHQJD/c9FF2FF1fZQoaAZHwEeEvjfek59oB030AWgIR0CQ/wAcT8HfdX2UKGgGR8BCmgh0Qsf8aAdN9AFoCEdAkP6Mbm2b5XV9lChoBkfAby/apPykK2gHTfQBaAhHQJD+Gd+Xqqx1fZQoaAZHwGR88k2P1ctoB030AWgIR0CQ/aMz/IbPdX2UKGgGR8BHzbaqS5iFaAdN9AFoCEdAkP0v7zkIX3V9lChoBkfASj88PnSv1WgHTfQBaAhHQJD8vCrLhaV1fZQoaAZHwEeMSPluFYdoB030AWgIR0CQ/EfapPykdX2UKGgGR8BN6ClJpWWAaAdN9AFoCEdAkPvTkQwsXnV9lChoBkfAVCMrK/20zGgHTfQBaAhHQJD7X6ZYxL11fZQoaAZHwEVUT/Q0GeNoB030AWgIR0CQ+uyFPBSDdX2UKGgGR8BRtkOiFj/daAdN9AFoCEdAkPp4+r2g4HV9lChoBkfARMQxFiKBNGgHTfQBaAhHQJD55Y1YQrd1fZQoaAZHwFNgAJ9iMHdoB030AWgIR0CRI2jrzGxVdX2UKGgGR8BKqfSH/LkkaAdN9AFoCEdAkSLwjyFwk3V9lChoBkfAQpXkeZG8VmgHTfQBaAhHQJEifA6+36R1fZQoaAZHwEgLmITGo75oB030AWgIR0CRIgjZtelbdX2UKGgGR8Bk5tAgPmPpaAdN9AFoCEdAkSGVJg9eQnV9lChoBkfAX4BVghKUV2gHTfQBaAhHQJEhIX3xnWd1fZQoaAZHwEJRwy6+WW1oB030AWgIR0CRIK7qIJqqdX2UKGgGR8BMY0Y0l7dBaAdN9AFoCEdAkSA4PkJa7nV9lChoBkfAQajakAPuomgHTfQBaAhHQJEfxPxhDw91fZQoaAZHwEGypcX3xnZoB030AWgIR0CRH1E5QxetdX2UKGgGR8BlFi5TZQHiaAdN9AFoCEdAkR7c6V+qi3V9lChoBkfATYJokAxSHmgHTfQBaAhHQJEeaJ1q33J1fZQoaAZHwGExgm7aqS5oB030AWgIR0CRHfSr5qM4dX2UKGgGR8BI4mdqcmShaAdN9AFoCEdAkR2BikO7QXV9lChoBkfATL/zlLeyiWgHTfQBaAhHQJEdDgEU0vZ1fZQoaAZHwEVJfNzKcNJoB030AWgIR0CRHHqR2bG4dX2UKGgGR8BIYDv/io87aAdN9AFoCEdAkUYJnYg7o3V9lChoBkfAZmqJlar3kGgHTfQBaAhHQJFFkUIsyzp1fZQoaAZHwEBS2n889wFoB030AWgIR0CRRRzAvcrRdX2UKGgGR8BI4NI065oXaAdN9AFoCEdAkUSpjlPrOnV9lChoBkfAWC1BMSK3u2gHTfQBaAhHQJFENdrwe/51fZQoaAZHwFktQ1aW5YpoB030AWgIR0CRQ8IuoP07dX2UKGgGR8BMYiT+vQnhaAdN9AFoCEdAkUNPm9xp+XV9lChoBkfASwaFGoaUA2gHTfQBaAhHQJFC2PDHfdh1fZQoaAZHwE5m4R28qWloB030AWgIR0CRQmWsijcmdX2UKGgGR8BEi/1QIldDaAdN9AFoCEdAkUHx6nivPnV9lChoBkfASiuR3eN1hmgHTfQBaAhHQJFBfZvkzXV1fZQoaAZHwER3cQAdXDFoB030AWgIR0CRQQlQuVX4dX2UKGgGR8BZqxsZYPoWaAdN9AFoCEdAkUCVYhdMTXV9lChoBkfAYV16E8JUpGgHTfQBaAhHQJFAIkRjBmB1fZQoaAZHwFTzn/kvK2doB030AWgIR0CRP668QI2PdX2UKGgGR8BFJad+XqqwaAdN9AFoCEdAkT8bTDwYtXV9lChoBkfAcOlXkHUtqmgHTfQBaAhHQJF84LfDUEx1fZQoaAZHwFckk1Muez5oB030AWgIR0CRfGhW5paidX2UKGgGR8B1NpIy0rsjaAdN9AFoCEdAkXvz1oQFtHV9lChoBkfASuo8uBczImgHTfQBaAhHQJF7gKUmlZZ1fZQoaAZHwEUb4gRsdktoB030AWgIR0CRewz5oGpudX2UKGgGR8CD0FZElVtGaAdN9AFoCEdAkXqZTMqz7nV9lChoBkfAYIPdhRZU1mgHTfQBaAhHQJF6JrzoUzt1fZQoaAZHwEUJL7oB7u5oB030AWgIR0CRebAP/aQFdX2UKGgGR8BIQ15Sm65HaAdN9AFoCEdAkXk8yvcJt3V9lChoBkfARdkmQbMot2gHTfQBaAhHQJF4yQwK0D51fZQoaAZHwENew7kn1FpoB030AWgIR0CReFS88La3dX2UKGgGR8BMJetKZlWfaAdN9AFoCEdAkXfgb+98JHV9lChoBkfARBgao/A0sWgHTfQBaAhHQJF3bH5rP+p1fZQoaAZHwEdwmG/N7jVoB030AWgIR0CRdvlcyFfzdX2UKGgGR8BR3aLS/j82aAdN9AFoCEdAkXaF0YCQtHV9lChoBkfAQuPeenQ6ZGgHTfQBaAhHQJF18mOU+s51fZQoaAZHwEns25xzaK1oB030AWgIR0CRm0OPNmlJdX2UKGgGR8BAOxkupS75aAdN9AFoCEdAkZrLNSqEOHV9lChoBkfAS/JBX0XgtWgHTfQBaAhHQJGaVrYXfqJ1fZQoaAZHwEh0cDr7fpFoB030AWgIR0CRmeOM2m52dX2UKGgGR8BJLV50KZ2IaAdN9AFoCEdAkZlv20zCUHV9lChoBkfARHA1cdHUdGgHTfQBaAhHQJGY/DDTBqN1fZQoaAZHwEX0BKcurZJoB030AWgIR0CRmImnfl6rdX2UKGgGR8BkVLORkmQbaAdN9AFoCEdAkZgS/sVtXXV9lChoBkfAT7+lyimEXmgHTfQBaAhHQJGXn73wkPd1fZQoaAZHwEIS25xzaK1oB030AWgIR0CRlyv9tMwldX2UKGgGR8BeV9bTtsvaaAdN9AFoCEdAkZa3sgMc63V9lChoBkfAUT2Op84Pw2gHTfQBaAhHQJGWQ2jwhGJ1fZQoaAZHwHIT4O+ZgG9oB030AWgIR0CRlc97WuoxdX2UKGgGR8BBCIlMRHwxaAdN9AFoCEdAkZVcW9DhL3V9lChoBkfAUZO1D0Dlo2gHTfQBaAhHQJGU6NYKYzB1fZQoaAZHwD7H0pVjqfRoB030AWgIR0CRlFVsDW9UdX2UKGgGR8BIEr+YMOPOaAdN9AFoCEdAkbo8uzyBkXV9lChoBkfAQzvmPo3aSWgHTfQBaAhHQJG5xFOO8011fZQoaAZHwEJZ9Wp6yB1oB030AWgIR0CRuU/O+qR2dX2UKGgGR8BC8el0o0AMaAdN9AFoCEdAkbjcmfGuLnV9lChoBkfAPXv/m1YyPGgHTfQBaAhHQJG4aOinHed1fZQoaAZHwEFgCkGiYb9oB030AWgIR0CRt/VBD5TIdX2UKGgGR8BD7a+WWyC4aAdN9AFoCEdAkbeCrgflqHV9lChoBkfATqCAQQL/j2gHTfQBaAhHQJG3DAeq7yx1fZQoaAZHwEJbf+jua4NoB030AWgIR0CRtpjENvwWdX2UKGgGR8A/ADdP+GXYaAdN9AFoCEdAkbYlAAyVOnV9lChoBkfAUHiVdHDrJWgHTfQBaAhHQJG1sLeANG51fZQoaAZHwEdG814xDb9oB030AWgIR0CRtTxs2vSudX2UKGgGR8BPQBTn7pFDaAdN9AFoCEdAkbTIfOlfq3V9lChoBkfARXMuL74zrWgHTfQBaAhHQJG0VVp9JBh1fZQoaAZHwEP/RvWH1vloB030AWgIR0CRs+HRCx/vdX2UKGgGR8BKj6SLZSNwaAdN9AFoCEdAkbNOY6XBxnVlLg=="
|
43 |
},
|
44 |
"ep_success_buffer": {
|
45 |
":type:": "<class 'collections.deque'>",
|
46 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
47 |
},
|
48 |
+
"_n_updates": 56225,
|
49 |
"observation_space": {
|
50 |
":type:": "<class 'gymnasium.spaces.dict.Dict'>",
|
51 |
":serialized:": "gAWVzAMAAAAAAACMFWd5bW5hc2l1bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojAhhcm1fcXBvc5SMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBgAAAAAAAAABAQEBAQGUaBOMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLBoWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBwolgYAAAAAAAAAAQEBAQEBlGggSwaFlGgkdJRSlIwGX3NoYXBllEsGhZSMA2xvd5RoHCiWGAAAAAAAAADbD0nA2w9JwNsPScDbD0nA2w9JwNsPScCUaBZLBoWUaCR0lFKUjARoaWdolGgcKJYYAAAAAAAAANsPSUDbD0lA2w9JQNsPSUDbD0lA2w9JQJRoFksGhZRoJHSUUpSMCGxvd19yZXBylIwKLTMuMTQxNTkyN5SMCWhpZ2hfcmVwcpSMCTMuMTQxNTkyN5SMCl9ucF9yYW5kb22UTnVijAhhcm1fcXZlbJRoDSmBlH2UKGgQaBZoGWgcKJYGAAAAAAAAAAEBAQEBAZRoIEsGhZRoJHSUUpRoJ2gcKJYGAAAAAAAAAAEBAQEBAZRoIEsGhZRoJHSUUpRoLEsGhZRoLmgcKJYYAAAAAAAAAAAAIMEAACDBAAAgwQAAIMEAACDBAAAgwZRoFksGhZRoJHSUUpRoM2gcKJYYAAAAAAAAAAAAIEEAACBBAAAgQQAAIEEAACBBAAAgQZRoFksGhZRoJHSUUpRoOIwFLTEwLjCUaDqMBDEwLjCUaDxOdWKMCGN1YmVfcG9zlGgNKYGUfZQoaBBoFmgZaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgnaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgsSwOFlGguaBwolgwAAAAAAAAAAAAgwQAAIMEAACDBlGgWSwOFlGgkdJRSlGgzaBwolgwAAAAAAAAAAAAgQQAAIEEAACBBlGgWSwOFlGgkdJRSlGg4jAUtMTAuMJRoOowEMTAuMJRoPE51YnVoLE5oEE5oPE51Yi4=",
|
|
|
83 |
"__module__": "stable_baselines3.common.buffers",
|
84 |
"__annotations__": "{'observation_space': <class 'gymnasium.spaces.dict.Dict'>, 'obs_shape': typing.Dict[str, typing.Tuple[int, ...]], 'observations': typing.Dict[str, numpy.ndarray], 'next_observations': typing.Dict[str, numpy.ndarray]}",
|
85 |
"__doc__": "\n Dict Replay buffer used in off-policy algorithms like SAC/TD3.\n Extends the ReplayBuffer to use dictionary observations\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n Disabled for now (see https://github.com/DLR-RM/stable-baselines3/pull/243#discussion_r531535702)\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
|
86 |
+
"__init__": "<function DictReplayBuffer.__init__ at 0x7f3b3eeee3b0>",
|
87 |
+
"add": "<function DictReplayBuffer.add at 0x7f3b3eeee440>",
|
88 |
+
"sample": "<function DictReplayBuffer.sample at 0x7f3b3eeee4d0>",
|
89 |
+
"_get_samples": "<function DictReplayBuffer._get_samples at 0x7f3b3eeee560>",
|
90 |
"__abstractmethods__": "frozenset()",
|
91 |
+
"_abc_impl": "<_abc._abc_data object at 0x7f3b3eee8340>"
|
92 |
},
|
93 |
"replay_buffer_kwargs": {},
|
94 |
"train_freq": {
|
tqc-ReachCube-v0/ent_coef_optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1940
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f081826a2e36045e49f74f9367025287c6eda5765bd2bca3df750016054ba1a
|
3 |
size 1940
|
tqc-ReachCube-v0/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1548985
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48d0c1ea42c7e6052c07ad60c0280d1d47cd33384d16f6ba09035fecd86ff4a7
|
3 |
size 1548985
|
tqc-ReachCube-v0/pytorch_variables.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1180
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ad2edb527813bfeb6d5184a424ad9cb638c8aab9ca2cddda86b7fa5d689164e
|
3 |
size 1180
|
train_eval_metrics.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:743070671f8db75cf8e1d4d82e7827a65d206b6d9f3c4712ee56c8be8ee51b8c
|
3 |
+
size 71115
|