diff --git a/checkpoints/ag4/benchmark_summary.txt b/checkpoints/ag4/benchmark_summary.txt new file mode 100644 index 0000000000000000000000000000000000000000..3849a15c4aff44727eb99c3a176e538356da9135 --- /dev/null +++ b/checkpoints/ag4/benchmark_summary.txt @@ -0,0 +1,11 @@ +======================================== + FINAL SUMMARY +======================================== +Environment: antmaze-giant-navigate-singletask-task4-v0 +Agent: offline +Seed: 3 + +Evaluation (50 episodes): + Success Rate: 74.0% + Mean Return: -834.9 +======================================== diff --git a/checkpoints/ag4/params_online_sd000.pkl b/checkpoints/ag4/params_online_sd000.pkl new file mode 100644 index 0000000000000000000000000000000000000000..1f4f5457fa0352646b8fb279eb376d13a169f6a2 --- /dev/null +++ b/checkpoints/ag4/params_online_sd000.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b5b83c4b45fcc1e0720c19630a3581f07c33cb417c424168eee3a5ab89c2a11 +size 50691239 diff --git a/checkpoints/ag4/params_online_sd001.pkl b/checkpoints/ag4/params_online_sd001.pkl new file mode 100644 index 0000000000000000000000000000000000000000..e909d7538f236cb6a8383348f9b17be942022779 --- /dev/null +++ b/checkpoints/ag4/params_online_sd001.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5374cf256a0f0c78783b5bfed3e589fb0a58a060179aabe8a26cd550fc2cd4ec +size 50691239 diff --git a/checkpoints/ag4/params_online_sd002.pkl b/checkpoints/ag4/params_online_sd002.pkl new file mode 100644 index 0000000000000000000000000000000000000000..526529f945a2b04dc56d0ba13e5c8f8831fce0f6 --- /dev/null +++ b/checkpoints/ag4/params_online_sd002.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aff3d12c480d5cc4460f61c46e66b69063669d80d581e5149bcdf6e5faf384d6 +size 50691239 diff --git a/checkpoints/ag4/params_online_sd003.pkl b/checkpoints/ag4/params_online_sd003.pkl new file mode 100644 index 0000000000000000000000000000000000000000..cf803ab1cf3e9c3fedec76e90bc706c7b7c807a1 --- /dev/null +++ b/checkpoints/ag4/params_online_sd003.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17392a63e293d271b0261be6cd24d73d0e06c41b7b76985d4861c5c703742131 +size 50691239 diff --git a/checkpoints/ag4/params_online_sd004.pkl b/checkpoints/ag4/params_online_sd004.pkl new file mode 100644 index 0000000000000000000000000000000000000000..d9fbe1bd347d3aff54258bd531a2be463f904268 --- /dev/null +++ b/checkpoints/ag4/params_online_sd004.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:220ffd640d9c8634de8ba22f451c60abf2fca5ecbab60c3602e818f9f9d745f1 +size 50691239 diff --git a/checkpoints/ag5/benchmark_summary.txt b/checkpoints/ag5/benchmark_summary.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad6959de14961f2ea2cb749c729df33ebf4ed724 --- /dev/null +++ b/checkpoints/ag5/benchmark_summary.txt @@ -0,0 +1,11 @@ +======================================== + FINAL SUMMARY +======================================== +Environment: antmaze-giant-navigate-singletask-task5-v0 +Agent: offline +Seed: 4 + +Evaluation (50 episodes): + Success Rate: 92.0% + Mean Return: -549.0 +======================================== diff --git a/checkpoints/ag5/params_online_sd000.pkl b/checkpoints/ag5/params_online_sd000.pkl new file mode 100644 index 0000000000000000000000000000000000000000..98f72dd9999459617af8c139d6ca9404cdfa3914 --- /dev/null +++ b/checkpoints/ag5/params_online_sd000.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ea8ad82449dba5668b046b48c761a6b37e97ee07d0ea7b3d16d73714db91ef1 +size 50691239 diff --git a/checkpoints/ag5/params_online_sd001.pkl b/checkpoints/ag5/params_online_sd001.pkl new file mode 100644 index 0000000000000000000000000000000000000000..0720205e54073e24fa9d0614b8e4e62ddc8f5ce4 --- /dev/null +++ b/checkpoints/ag5/params_online_sd001.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9a258663106e83e1df7b0a3907c45d0e1ed45033bd12674faff5027b87827ab +size 50691239 diff --git a/checkpoints/ag5/params_online_sd002.pkl b/checkpoints/ag5/params_online_sd002.pkl new file mode 100644 index 0000000000000000000000000000000000000000..90adf579fb00ecfd7843348ea3106a91e13b687f --- /dev/null +++ b/checkpoints/ag5/params_online_sd002.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2da913a56e2e89a4ba280221c01d194ff26549df4e24fa4da8793d1e50b71f1 +size 50691239 diff --git a/checkpoints/ag5/params_online_sd003.pkl b/checkpoints/ag5/params_online_sd003.pkl new file mode 100644 index 0000000000000000000000000000000000000000..32b68626b17923a0cab4982ce19d68cb8e93cb8d --- /dev/null +++ b/checkpoints/ag5/params_online_sd003.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d120c7fcb5d81ce0ae7b0fb1aed2f635525dddf8ba0d5bd9412b4f357ea14cc9 +size 50691239 diff --git a/checkpoints/ag5/params_online_sd004.pkl b/checkpoints/ag5/params_online_sd004.pkl new file mode 100644 index 0000000000000000000000000000000000000000..de4d98964e4afc0da321a71dedd62f050d76af7f --- /dev/null +++ b/checkpoints/ag5/params_online_sd004.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bc2939fad8f1e4f1b7555fd49b0de3c2886d826f30ef67e31fad9277f0eae1e +size 50691239 diff --git a/checkpoints/can/benchmark_summary.txt b/checkpoints/can/benchmark_summary.txt new file mode 100644 index 0000000000000000000000000000000000000000..74811eb6c7f0c76d81bc174901c6c47213b7dcb9 --- /dev/null +++ b/checkpoints/can/benchmark_summary.txt @@ -0,0 +1,11 @@ +======================================== + FINAL SUMMARY +======================================== +Environment: can-mh-low_dim +Agent: offline +Seed: 3 + +Evaluation (50 episodes): + Success Rate: 94.0% + Mean Return: 0.9 +======================================== diff --git a/checkpoints/can/params_online_sd000.pkl b/checkpoints/can/params_online_sd000.pkl new file mode 100644 index 0000000000000000000000000000000000000000..9f2884c1d0c2ab960b35f268ee4898561bfa2a8f --- /dev/null +++ b/checkpoints/can/params_online_sd000.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9103b339c739720bcd30cae90ccaaf9ea22ee64eecf9329b9035539dd3edb63e +size 50322539 diff --git a/checkpoints/can/params_online_sd001.pkl b/checkpoints/can/params_online_sd001.pkl new file mode 100644 index 0000000000000000000000000000000000000000..a19e7df72a4dd6111fb3edfd0842d5559a06c1c7 --- /dev/null +++ b/checkpoints/can/params_online_sd001.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1135d5875c4d36f954f5bc98e9fb989f0db833b3bfead85615231ed29d224001 +size 50322539 diff --git a/checkpoints/can/params_online_sd002.pkl b/checkpoints/can/params_online_sd002.pkl new file mode 100644 index 0000000000000000000000000000000000000000..c4c6f97ebff3503d61a34470831ab3b26f2e4c86 --- /dev/null +++ b/checkpoints/can/params_online_sd002.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7d72fa42a28544aa52931c9314825238b6976c1706f3d00d402bebc7aa2ea60 +size 50322539 diff --git a/checkpoints/can/params_online_sd003.pkl b/checkpoints/can/params_online_sd003.pkl new file mode 100644 index 0000000000000000000000000000000000000000..74f1feae938413928a66cbe9d177835c5ecd69d5 --- /dev/null +++ b/checkpoints/can/params_online_sd003.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4dc0b82eb7b9248de9bd05072f2d70b364376d417e1c2284b104bca719ea613 +size 50322539 diff --git a/checkpoints/can/params_online_sd004.pkl b/checkpoints/can/params_online_sd004.pkl new file mode 100644 index 0000000000000000000000000000000000000000..99ccefbe520cc3695d81138de0ff55b16051f5c9 --- /dev/null +++ b/checkpoints/can/params_online_sd004.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:752715b422ceb6f59982d283cbe184de127224a69887651a775d8018096ef975 +size 50322539 diff --git a/checkpoints/cdp3/benchmark_summary.txt b/checkpoints/cdp3/benchmark_summary.txt new file mode 100644 index 0000000000000000000000000000000000000000..94d33de29239ab136082a36800d8666fe6d0880c --- /dev/null +++ b/checkpoints/cdp3/benchmark_summary.txt @@ -0,0 +1,11 @@ +======================================== + FINAL SUMMARY +======================================== +Environment: cube-double-play-singletask-task3-v0 +Agent: offline +Seed: 4 + +Evaluation (50 episodes): + Success Rate: 100.0% + Mean Return: -123.2 +======================================== diff --git a/checkpoints/cdp3/params_online_sd000.pkl b/checkpoints/cdp3/params_online_sd000.pkl new file mode 100644 index 0000000000000000000000000000000000000000..c68124864bfbb53f4ca8beab479213e02d144b6b --- /dev/null +++ b/checkpoints/cdp3/params_online_sd000.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1ce5d544991d9826a5dd246f89ea8be50be3a93d307a3ac3d86174a28a03e15 +size 50383832 diff --git a/checkpoints/cdp3/params_online_sd001.pkl b/checkpoints/cdp3/params_online_sd001.pkl new file mode 100644 index 0000000000000000000000000000000000000000..d91a4e53ef184ca23d91548f0c920672f7427bd8 --- /dev/null +++ b/checkpoints/cdp3/params_online_sd001.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b40f0e7c44c121776f87a9ab86a252456cf491b3739191519f6553e816ed4926 +size 50383832 diff --git a/checkpoints/cdp3/params_online_sd002.pkl b/checkpoints/cdp3/params_online_sd002.pkl new file mode 100644 index 0000000000000000000000000000000000000000..ae1451739292527a97d79420676030374e0f57d2 --- /dev/null +++ b/checkpoints/cdp3/params_online_sd002.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:078b8f307855b90cd38564183131539a2442e116c6f8efa2d08ee46ece6f36f4 +size 50383832 diff --git a/checkpoints/cdp3/params_online_sd003.pkl b/checkpoints/cdp3/params_online_sd003.pkl new file mode 100644 index 0000000000000000000000000000000000000000..49bc524f5871f9c60c20e2e76f0c3a2566e09d04 --- /dev/null +++ b/checkpoints/cdp3/params_online_sd003.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a493c0b20a732cbffb24badf078e19f7c21dc1a4fac50e6a29785fd43e93e14 +size 50383832 diff --git a/checkpoints/cdp3/params_online_sd004.pkl b/checkpoints/cdp3/params_online_sd004.pkl new file mode 100644 index 0000000000000000000000000000000000000000..8410641d9d7be4cd7038ba69c207a501fb55b177 --- /dev/null +++ b/checkpoints/cdp3/params_online_sd004.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91720c4e466d2c14d60bec45f67f56e7f3cb5eec0340982b972b797c7a34f899 +size 50383832 diff --git a/checkpoints/cdp4/benchmark_summary.txt b/checkpoints/cdp4/benchmark_summary.txt new file mode 100644 index 0000000000000000000000000000000000000000..21b9d3a72dceb618bdd1557aa1030c79c8741558 --- /dev/null +++ b/checkpoints/cdp4/benchmark_summary.txt @@ -0,0 +1,11 @@ +======================================== + FINAL SUMMARY +======================================== +Environment: cube-double-play-singletask-task4-v0 +Agent: offline +Seed: 3 + +Evaluation (50 episodes): + Success Rate: 100.0% + Mean Return: -267.8 +======================================== diff --git a/checkpoints/cdp4/params_online_sd000.pkl b/checkpoints/cdp4/params_online_sd000.pkl new file mode 100644 index 0000000000000000000000000000000000000000..14e707e2c1014f41fa5f94884d7d25a2112cde47 --- /dev/null +++ b/checkpoints/cdp4/params_online_sd000.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:784710e4e72cef99b11f503ec5e32575e8dd1a2414f74bda68349d237d44d6b0 +size 50383832 diff --git a/checkpoints/cdp4/params_online_sd001.pkl b/checkpoints/cdp4/params_online_sd001.pkl new file mode 100644 index 0000000000000000000000000000000000000000..2d8199a47af6da73b6eec9896862bd97d5f3918e --- /dev/null +++ b/checkpoints/cdp4/params_online_sd001.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53396bdc7af4b1fda853514ef60194dd2d8325e3f0697de3d66209fe26704414 +size 50383832 diff --git a/checkpoints/cdp4/params_online_sd002.pkl b/checkpoints/cdp4/params_online_sd002.pkl new file mode 100644 index 0000000000000000000000000000000000000000..3ed4956d196b87ad630210274030f46411f314dd --- /dev/null +++ b/checkpoints/cdp4/params_online_sd002.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e853b8ea0169f089c9dc3d816960c703a20a86b30cc20816bcd0472ffca1294e +size 50383832 diff --git a/checkpoints/cdp4/params_online_sd003.pkl b/checkpoints/cdp4/params_online_sd003.pkl new file mode 100644 index 0000000000000000000000000000000000000000..0f60cc10b97f862bc3fa74170b1c5184401512c8 --- /dev/null +++ b/checkpoints/cdp4/params_online_sd003.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93fe68fb13fac1cc8fb92c03c5fce38fa8d764f919dcb5d932b1035bb0d03c88 +size 50383832 diff --git a/checkpoints/cdp4/params_online_sd004.pkl b/checkpoints/cdp4/params_online_sd004.pkl new file mode 100644 index 0000000000000000000000000000000000000000..6cda1b882da73b46d17f885415457d60609c9026 --- /dev/null +++ b/checkpoints/cdp4/params_online_sd004.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c5917eba397973f5785ccbbec88b7183b42dcd84e4098e6f336e959fc7337b5 +size 50383832 diff --git a/checkpoints/ctrp3/benchmark_summary.txt b/checkpoints/ctrp3/benchmark_summary.txt new file mode 100644 index 0000000000000000000000000000000000000000..01af332992a8e26c5467b0ab30982b34453046e5 --- /dev/null +++ b/checkpoints/ctrp3/benchmark_summary.txt @@ -0,0 +1,11 @@ +======================================== + FINAL SUMMARY +======================================== +Environment: cube-triple-play-singletask-task3-v0 +Agent: offline +Seed: 4 + +Evaluation (50 episodes): + Success Rate: 76.0% + Mean Return: -906.7 +======================================== diff --git a/checkpoints/ctrp3/params_online_sd000.pkl b/checkpoints/ctrp3/params_online_sd000.pkl new file mode 100644 index 0000000000000000000000000000000000000000..21d3185ce3f5ed1d47b2dbc056f0e15b73263739 --- /dev/null +++ b/checkpoints/ctrp3/params_online_sd000.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5301c1058a6cf086f7f36552c3d6b12afea012c982d03c7e149a4e6e4cb6b358 +size 50660312 diff --git a/checkpoints/ctrp3/params_online_sd001.pkl b/checkpoints/ctrp3/params_online_sd001.pkl new file mode 100644 index 0000000000000000000000000000000000000000..8ea9be0afe33ccd95a1bcb67aed62168e189bc0a --- /dev/null +++ b/checkpoints/ctrp3/params_online_sd001.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:672a809ebb1a65f47f223506c12771a653fb870d6d557e500c1fc098a58c6370 +size 50660312 diff --git a/checkpoints/ctrp3/params_online_sd002.pkl b/checkpoints/ctrp3/params_online_sd002.pkl new file mode 100644 index 0000000000000000000000000000000000000000..163e61304d2c3dfce73d45d75466c38aa9952a9c --- /dev/null +++ b/checkpoints/ctrp3/params_online_sd002.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63bb9a045a22bbe2a18a65d462aceff332d6dfb3fab725299d513599b250a60d +size 50660312 diff --git a/checkpoints/ctrp3/params_online_sd003.pkl b/checkpoints/ctrp3/params_online_sd003.pkl new file mode 100644 index 0000000000000000000000000000000000000000..b317e36b3d7e39837778f96de3164a27c6ffb2b8 --- /dev/null +++ b/checkpoints/ctrp3/params_online_sd003.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ab90eb5274be7208d8dc9b706cc9ce92af98eeeb0a2da954d4a301e818c628f +size 50660312 diff --git a/checkpoints/ctrp3/params_online_sd004.pkl b/checkpoints/ctrp3/params_online_sd004.pkl new file mode 100644 index 0000000000000000000000000000000000000000..b1ac0fabb2c73e4193a6b5c0f50f3de59e00e529 --- /dev/null +++ b/checkpoints/ctrp3/params_online_sd004.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91b1036c93edb9fcd18e16f6e8f6a2bd664e518b9e2bb05e6c014817821175ef +size 50660312 diff --git a/checkpoints/ctrp4/benchmark_summary.txt b/checkpoints/ctrp4/benchmark_summary.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8c1b8b246cdc79a70c41eac6ff3a84083c59a2e --- /dev/null +++ b/checkpoints/ctrp4/benchmark_summary.txt @@ -0,0 +1,11 @@ +======================================== + FINAL SUMMARY +======================================== +Environment: cube-triple-play-singletask-task4-v0 +Agent: offline +Seed: 0 + +Evaluation (50 episodes): + Success Rate: 80.0% + Mean Return: -1032.8 +======================================== diff --git a/checkpoints/ctrp4/params_online_sd000.pkl b/checkpoints/ctrp4/params_online_sd000.pkl new file mode 100644 index 0000000000000000000000000000000000000000..7cab76fc85450bc6a765324d28828fe6f1e247ec --- /dev/null +++ b/checkpoints/ctrp4/params_online_sd000.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fa73596fe1d120a43d9b1910612bece3c8512e1d9357b07cc14bc542d914b54 +size 50660312 diff --git a/checkpoints/ctrp4/params_online_sd001.pkl b/checkpoints/ctrp4/params_online_sd001.pkl new file mode 100644 index 0000000000000000000000000000000000000000..52d726cde507d4c7cee0e19fc74210a2d011f85b --- /dev/null +++ b/checkpoints/ctrp4/params_online_sd001.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:013123b89c22632fcae07877e24b959d7e61db2d5b8122e92ffe51224b4b79ef +size 50660312 diff --git a/checkpoints/ctrp4/params_online_sd002.pkl b/checkpoints/ctrp4/params_online_sd002.pkl new file mode 100644 index 0000000000000000000000000000000000000000..54690d300943ee235128f365496d9ca80df63568 --- /dev/null +++ b/checkpoints/ctrp4/params_online_sd002.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17dfc1d934074cd7f25330046c4057bf205302a3a5c16063942a3a32a6aeedb1 +size 50660312 diff --git a/checkpoints/ctrp4/params_online_sd003.pkl b/checkpoints/ctrp4/params_online_sd003.pkl new file mode 100644 index 0000000000000000000000000000000000000000..1fec5693eb93f38b0c5d94d91e0e57cbce9f602f --- /dev/null +++ b/checkpoints/ctrp4/params_online_sd003.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:962009aa526ccd8ac857acd69c934339b39db43b973202c948d16f4b05c72b0b +size 50660312 diff --git a/checkpoints/ctrp4/params_online_sd004.pkl b/checkpoints/ctrp4/params_online_sd004.pkl new file mode 100644 index 0000000000000000000000000000000000000000..a134b42b36f6f9dbb83a0cb11b1767426077a728 --- /dev/null +++ b/checkpoints/ctrp4/params_online_sd004.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15509620fbc803b5fa88d30f2db60998a58c44dd4b65778ada8b614978e8d3a4 +size 50660312 diff --git a/checkpoints/hm3/benchmark_summary.txt b/checkpoints/hm3/benchmark_summary.txt new file mode 100644 index 0000000000000000000000000000000000000000..11c3bc2fb2ea3df56c084f8c08854c73fb68c968 --- /dev/null +++ b/checkpoints/hm3/benchmark_summary.txt @@ -0,0 +1,11 @@ +======================================== + FINAL SUMMARY +======================================== +Environment: humanoidmaze-medium-navigate-singletask-task3-v0 +Agent: offline +Seed: 2 + +Evaluation (50 episodes): + Success Rate: 60.0% + Mean Return: -1722.0 +======================================== diff --git a/checkpoints/hm3/params_online_sd000.pkl b/checkpoints/hm3/params_online_sd000.pkl new file mode 100644 index 0000000000000000000000000000000000000000..179e233025cf098b838112f5d394a240b021094d --- /dev/null +++ b/checkpoints/hm3/params_online_sd000.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42309fdd9835bbf6fa5a0b31030ae1b477de399ee80e79b98c00ee8096f70ef6 +size 54316991 diff --git a/checkpoints/hm3/params_online_sd001.pkl b/checkpoints/hm3/params_online_sd001.pkl new file mode 100644 index 0000000000000000000000000000000000000000..8279eba70e907ed0ddeaa1d2b58c03ec04dffb65 --- /dev/null +++ b/checkpoints/hm3/params_online_sd001.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ed72e5b3c5ae77bb4977fce4a730ce5d11af745a4e738852d4bbab15eb034a9 +size 54316991 diff --git a/checkpoints/hm3/params_online_sd002.pkl b/checkpoints/hm3/params_online_sd002.pkl new file mode 100644 index 0000000000000000000000000000000000000000..bd59bf4d74fc1d37a608d02dac256d49a8db64c2 --- /dev/null +++ b/checkpoints/hm3/params_online_sd002.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1dfd74b50df8ec61858b5629174f4ee2aa1540cc3d73530dbc874e00e8e534e +size 54316991 diff --git a/checkpoints/hm3/params_online_sd003.pkl b/checkpoints/hm3/params_online_sd003.pkl new file mode 100644 index 0000000000000000000000000000000000000000..88ca50e52b1a403609bdfd3036419ebdefc704b7 --- /dev/null +++ b/checkpoints/hm3/params_online_sd003.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dc39ccf75691d18e0dd701efca63111a15fbeb6035744188c6c701ad265d431 +size 54316991 diff --git a/checkpoints/hm3/params_online_sd004.pkl b/checkpoints/hm3/params_online_sd004.pkl new file mode 100644 index 0000000000000000000000000000000000000000..32c3abd00ffced5d9cc14ea0488f6864c2684579 --- /dev/null +++ b/checkpoints/hm3/params_online_sd004.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45cf7e7998e1faa8fe8d367968a67e1eac53ed7ebd6cce467c823bda521d18b3 +size 54316991 diff --git a/checkpoints/hm4/benchmark_summary.txt b/checkpoints/hm4/benchmark_summary.txt new file mode 100644 index 0000000000000000000000000000000000000000..063f83f84032a50d3a4ae2e76d5c5e9a796b8a11 --- /dev/null +++ b/checkpoints/hm4/benchmark_summary.txt @@ -0,0 +1,11 @@ +======================================== + FINAL SUMMARY +======================================== +Environment: humanoidmaze-medium-navigate-singletask-task4-v0 +Agent: offline +Seed: 3 + +Evaluation (50 episodes): + Success Rate: 4.0% + Mean Return: -1990.7 +======================================== diff --git a/checkpoints/hm4/params_online_sd000.pkl b/checkpoints/hm4/params_online_sd000.pkl new file mode 100644 index 0000000000000000000000000000000000000000..1a3f4093ec934e05c9f276e817307caaa16ba99c --- /dev/null +++ b/checkpoints/hm4/params_online_sd000.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2c3bdc67c93a18a4cc00680a0aca78d897bd54c33e13695dffbe34886cd2ba7 +size 54316991 diff --git a/checkpoints/hm4/params_online_sd001.pkl b/checkpoints/hm4/params_online_sd001.pkl new file mode 100644 index 0000000000000000000000000000000000000000..1a2bbda78a4aefbb75591352472c37a13361e07b --- /dev/null +++ b/checkpoints/hm4/params_online_sd001.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4438014c89224cb082ec621af4543c668e3da6bfe42747022447f8cb592a73f +size 54316991 diff --git a/checkpoints/hm4/params_online_sd002.pkl b/checkpoints/hm4/params_online_sd002.pkl new file mode 100644 index 0000000000000000000000000000000000000000..4642e1c5b752ade2fe2afd8a5bdf6b74ffc3a239 --- /dev/null +++ b/checkpoints/hm4/params_online_sd002.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0965e3abe1cb76906a0eaf9ce6112a8b8867d6d59e16997de83197a229b8a8b7 +size 54316991 diff --git a/checkpoints/hm4/params_online_sd003.pkl b/checkpoints/hm4/params_online_sd003.pkl new file mode 100644 index 0000000000000000000000000000000000000000..b9b3cb0e7d8422b4d32a6cc9818adb461eb80726 --- /dev/null +++ b/checkpoints/hm4/params_online_sd003.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:760b1d0c594a44b5783df69b0ae82bdc2aff36b6b426d30b981c8511a5ef1913 +size 54316991 diff --git a/checkpoints/hm4/params_online_sd004.pkl b/checkpoints/hm4/params_online_sd004.pkl new file mode 100644 index 0000000000000000000000000000000000000000..c2f2e1e822c446eda059c49d75edff2cec2cd0e3 --- /dev/null +++ b/checkpoints/hm4/params_online_sd004.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e47de7cc7629386a795d31feb1d82d795dc6424f4289031d0230d662dd1d24bd +size 54316991 diff --git a/checkpoints/sc4/benchmark_summary.txt b/checkpoints/sc4/benchmark_summary.txt new file mode 100644 index 0000000000000000000000000000000000000000..9ad869612cd7647a556046d0c85b2336fc39e82b --- /dev/null +++ b/checkpoints/sc4/benchmark_summary.txt @@ -0,0 +1,11 @@ +======================================== + FINAL SUMMARY +======================================== +Environment: scene-play-singletask-task4-v0 +Agent: offline +Seed: 3 + +Evaluation (50 episodes): + Success Rate: 100.0% + Mean Return: -179.0 +======================================== diff --git a/checkpoints/sc4/params_online_sd000.pkl b/checkpoints/sc4/params_online_sd000.pkl new file mode 100644 index 0000000000000000000000000000000000000000..3ea4c2d16b31cc444e3a4216d697f9527bc32eae --- /dev/null +++ b/checkpoints/sc4/params_online_sd000.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5cd82ca01f0b353931d682e2424af0fc7a9b41bc00f96b93db216b47676c9b2 +size 50475992 diff --git a/checkpoints/sc4/params_online_sd001.pkl b/checkpoints/sc4/params_online_sd001.pkl new file mode 100644 index 0000000000000000000000000000000000000000..8a5833571a82659b92ca4f8fbc5e18d5f8f5ff3c --- /dev/null +++ b/checkpoints/sc4/params_online_sd001.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55090db106d33f97a9eee606f774360eb36bb24ae8b369037934df99b2354ba6 +size 50475992 diff --git a/checkpoints/sc4/params_online_sd002.pkl b/checkpoints/sc4/params_online_sd002.pkl new file mode 100644 index 0000000000000000000000000000000000000000..0b3d1bf088f14b42898a4e1e0b85dcac405a6cee --- /dev/null +++ b/checkpoints/sc4/params_online_sd002.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c590811c3a4d92d332093cdb62a1a433611a18b7db04e15d15789e6ce0963a3 +size 50475992 diff --git a/checkpoints/sc4/params_online_sd003.pkl b/checkpoints/sc4/params_online_sd003.pkl new file mode 100644 index 0000000000000000000000000000000000000000..ad59b28121bd759c9ee9d4ce072c638633695b00 --- /dev/null +++ b/checkpoints/sc4/params_online_sd003.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cbf9f39f05748e4acef7bdc483154ea9790d05849fe44e5d6b2d9b53d81a049 +size 50475992 diff --git a/checkpoints/sc4/params_online_sd004.pkl b/checkpoints/sc4/params_online_sd004.pkl new file mode 100644 index 0000000000000000000000000000000000000000..443f59f9c148743eda09447f68d6e24bfe2c2de7 --- /dev/null +++ b/checkpoints/sc4/params_online_sd004.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:113b59fc2a484aa4ccb66e75aa0c9f5a2ea063c3e91b28c55953f5abf28d082e +size 50475992 diff --git a/checkpoints/sc5/benchmark_summary.txt b/checkpoints/sc5/benchmark_summary.txt new file mode 100644 index 0000000000000000000000000000000000000000..423785dc237a97111f299d1b221fb3ed070c23b2 --- /dev/null +++ b/checkpoints/sc5/benchmark_summary.txt @@ -0,0 +1,11 @@ +======================================== + FINAL SUMMARY +======================================== +Environment: scene-play-singletask-task5-v0 +Agent: offline +Seed: 4 + +Evaluation (50 episodes): + Success Rate: 100.0% + Mean Return: -442.9 +======================================== diff --git a/checkpoints/sc5/params_online_sd000.pkl b/checkpoints/sc5/params_online_sd000.pkl new file mode 100644 index 0000000000000000000000000000000000000000..c34b5281ef70056de7a4c89bcf237e10b916f09e --- /dev/null +++ b/checkpoints/sc5/params_online_sd000.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba54454f218e4dba6b9b9ca8d7cb07d215b311a9af913b252c5a1f6c6a3c8c08 +size 50475992 diff --git a/checkpoints/sc5/params_online_sd001.pkl b/checkpoints/sc5/params_online_sd001.pkl new file mode 100644 index 0000000000000000000000000000000000000000..e6d1f45ca84b410ec48ff0724b04db7d673607fe --- /dev/null +++ b/checkpoints/sc5/params_online_sd001.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fde5aa0d1dc2dc6d25baed465505c175205ad171d9b0f41c5e4b32276a5418c +size 50475992 diff --git a/checkpoints/sc5/params_online_sd002.pkl b/checkpoints/sc5/params_online_sd002.pkl new file mode 100644 index 0000000000000000000000000000000000000000..e8847b58f41ead2e408ceeca8451d392b3fbeb6d --- /dev/null +++ b/checkpoints/sc5/params_online_sd002.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d13a264f076b53e9d16987cdb2f9153134cc7265c30136d6d8b316355980ce6 +size 50475992 diff --git a/checkpoints/sc5/params_online_sd003.pkl b/checkpoints/sc5/params_online_sd003.pkl new file mode 100644 index 0000000000000000000000000000000000000000..e4add9d389ba61c85291de46eb9703c7e25d08ba --- /dev/null +++ b/checkpoints/sc5/params_online_sd003.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a274ed8b34e364de991d15b681e436814cb3cf9735cc9488043d56fee431043 +size 50475992 diff --git a/checkpoints/sc5/params_online_sd004.pkl b/checkpoints/sc5/params_online_sd004.pkl new file mode 100644 index 0000000000000000000000000000000000000000..66f20750380729f87c54229f61fe1a334e61ff32 --- /dev/null +++ b/checkpoints/sc5/params_online_sd004.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e692fcf477fd5fd15975780cbb0e735f13984b302c8d05cb63858328fd28cf72 +size 50475992 diff --git a/checkpoints/square/benchmark_summary.txt b/checkpoints/square/benchmark_summary.txt new file mode 100644 index 0000000000000000000000000000000000000000..906dbc9c64291464b1a66d5d519361baa9990d54 --- /dev/null +++ b/checkpoints/square/benchmark_summary.txt @@ -0,0 +1,11 @@ +======================================== + FINAL SUMMARY +======================================== +Environment: square-mh-low_dim +Agent: offline +Seed: 4 + +Evaluation (50 episodes): + Success Rate: 94.0% + Mean Return: 0.9 +======================================== diff --git a/checkpoints/square/params_online_sd000.pkl b/checkpoints/square/params_online_sd000.pkl new file mode 100644 index 0000000000000000000000000000000000000000..2a170944f1e21d4eda57e60d04135f2a055c3687 --- /dev/null +++ b/checkpoints/square/params_online_sd000.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b6607e5cb5f4d46aa7db097129eedad136da8e79d994762ca46bc214a0dc2cb +size 50322539 diff --git a/checkpoints/square/params_online_sd001.pkl b/checkpoints/square/params_online_sd001.pkl new file mode 100644 index 0000000000000000000000000000000000000000..8f3592aabde3d032bf0264e55a4a88ec4b992d9b --- /dev/null +++ b/checkpoints/square/params_online_sd001.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:650ae0498e0fa91dab7b99ec341d790ca7ab6620dda73c91c42f78e4df6bcb04 +size 50322539 diff --git a/checkpoints/square/params_online_sd002.pkl b/checkpoints/square/params_online_sd002.pkl new file mode 100644 index 0000000000000000000000000000000000000000..ad539b1add743c1abcf5abb7b19423818b5eb936 --- /dev/null +++ b/checkpoints/square/params_online_sd002.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1c75185b771c71fbffc7d623c121800c4feb5134d407bf7199b8b691cb92876 +size 50322539 diff --git a/checkpoints/square/params_online_sd003.pkl b/checkpoints/square/params_online_sd003.pkl new file mode 100644 index 0000000000000000000000000000000000000000..290040ac3f267d6874cdc9f835ba7b8f53f7b609 --- /dev/null +++ b/checkpoints/square/params_online_sd003.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4610174e1eb3f76cc8c89fa55f6e24fc9692e7e3a0e52ab549e778c758c27511 +size 50322539 diff --git a/checkpoints/square/params_online_sd004.pkl b/checkpoints/square/params_online_sd004.pkl new file mode 100644 index 0000000000000000000000000000000000000000..25f804ace53d339a55b7bab65bb34dcb399b7e23 --- /dev/null +++ b/checkpoints/square/params_online_sd004.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d4953b2d881757154bf67fcd65c093d27561cda5d4fd92ff463181e589a099a +size 50322539