sgoodfriend
committed on
Commit
•
41e80f6
1
Parent(s):
69aa193
PPO playing Acrobot-v1 from https://github.com/sgoodfriend/rl-algo-impls/tree/5598ebc4b03054f16eebe76792486ba7bcacfc5c
Browse files
- benchmarks/colab_benchmark.ipynb +2 -17
- colab_enjoy.ipynb +2 -17
- colab_train.ipynb +7 -22
- huggingface_publish.py +1 -1
- replay.meta.json +1 -1
benchmarks/colab_benchmark.ipynb
CHANGED
@@ -5,7 +5,7 @@
|
|
5 |
"colab": {
|
6 |
"provenance": [],
|
7 |
"machine_shape": "hm",
|
8 |
-
"authorship_tag": "
|
9 |
"include_colab_link": true
|
10 |
},
|
11 |
"kernelspec": {
|
@@ -70,22 +70,7 @@
|
|
70 |
"cell_type": "code",
|
71 |
"source": [
|
72 |
"%%capture\n",
|
73 |
-
"!
|
74 |
-
"\n",
|
75 |
-
"with open(\"/root/.ssh/id_ed25519\", mode=\"w\") as f:\n",
|
76 |
-
" f.write(\"\"\"-----BEGIN OPENSSH PRIVATE KEY-----\n",
|
77 |
-
"b3BlbnNzaC1rZXktdjEAAAAABG5vbmUAAAAEbm9uZQAAAAAAAAABAAAAMwAAAAtzc2gtZW\n",
|
78 |
-
"QyNTUxOQAAACAkIepH6T90umhyp8+bkmSplqth1/+yxnu/Dax61KlSVAAAAKA4W3D3OFtw\n",
|
79 |
-
"9wAAAAtzc2gtZWQyNTUxOQAAACAkIepH6T90umhyp8+bkmSplqth1/+yxnu/Dax61KlSVA\n",
|
80 |
-
"AAAEA4SPGDm0/gofiOYXPTAi1Oxmw4mTppG2GdNgdMwMiDaSQh6kfpP3S6aHKnz5uSZKmW\n",
|
81 |
-
"q2HX/7LGe78NrHrUqVJUAAAAGmdvb2RmcmllbmQuc2NvdHRAZ21haWwuY29tAQID\n",
|
82 |
-
"-----END OPENSSH PRIVATE KEY-----\n",
|
83 |
-
"\"\"\"\n",
|
84 |
-
")\n",
|
85 |
-
"\n",
|
86 |
-
"!ssh-keyscan -t ed25519 github.com >> ~/.ssh/known_hosts\n",
|
87 |
-
"!chmod go-rwx /root/.ssh/id_ed25519\n",
|
88 |
-
"!git clone git@github.com:sgoodfriend/rl-algo-impls.git"
|
89 |
],
|
90 |
"metadata": {
|
91 |
"id": "k5ynTV25hdAf"
|
|
|
5 |
"colab": {
|
6 |
"provenance": [],
|
7 |
"machine_shape": "hm",
|
8 |
+
"authorship_tag": "ABX9TyOGIH7rqgasim3Sz7b1rpoE",
|
9 |
"include_colab_link": true
|
10 |
},
|
11 |
"kernelspec": {
|
|
|
70 |
"cell_type": "code",
|
71 |
"source": [
|
72 |
"%%capture\n",
|
73 |
+
"!git clone https://github.com/sgoodfriend/rl-algo-impls.git"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
74 |
],
|
75 |
"metadata": {
|
76 |
"id": "k5ynTV25hdAf"
|
colab_enjoy.ipynb
CHANGED
@@ -5,7 +5,7 @@
|
|
5 |
"colab": {
|
6 |
"provenance": [],
|
7 |
"machine_shape": "hm",
|
8 |
-
"authorship_tag": "
|
9 |
"include_colab_link": true
|
10 |
},
|
11 |
"kernelspec": {
|
@@ -90,22 +90,7 @@
|
|
90 |
"cell_type": "code",
|
91 |
"source": [
|
92 |
"%%capture\n",
|
93 |
-
"!
|
94 |
-
"\n",
|
95 |
-
"with open(\"/root/.ssh/id_ed25519\", mode=\"w\") as f:\n",
|
96 |
-
" f.write(\"\"\"-----BEGIN OPENSSH PRIVATE KEY-----\n",
|
97 |
-
"b3BlbnNzaC1rZXktdjEAAAAABG5vbmUAAAAEbm9uZQAAAAAAAAABAAAAMwAAAAtzc2gtZW\n",
|
98 |
-
"QyNTUxOQAAACAkIepH6T90umhyp8+bkmSplqth1/+yxnu/Dax61KlSVAAAAKA4W3D3OFtw\n",
|
99 |
-
"9wAAAAtzc2gtZWQyNTUxOQAAACAkIepH6T90umhyp8+bkmSplqth1/+yxnu/Dax61KlSVA\n",
|
100 |
-
"AAAEA4SPGDm0/gofiOYXPTAi1Oxmw4mTppG2GdNgdMwMiDaSQh6kfpP3S6aHKnz5uSZKmW\n",
|
101 |
-
"q2HX/7LGe78NrHrUqVJUAAAAGmdvb2RmcmllbmQuc2NvdHRAZ21haWwuY29tAQID\n",
|
102 |
-
"-----END OPENSSH PRIVATE KEY-----\n",
|
103 |
-
"\"\"\"\n",
|
104 |
-
")\n",
|
105 |
-
"\n",
|
106 |
-
"!ssh-keyscan -t ed25519 github.com >> ~/.ssh/known_hosts\n",
|
107 |
-
"!chmod go-rwx /root/.ssh/id_ed25519\n",
|
108 |
-
"!git clone git@github.com:sgoodfriend/rl-algo-impls.git"
|
109 |
],
|
110 |
"metadata": {
|
111 |
"id": "k5ynTV25hdAf"
|
|
|
5 |
"colab": {
|
6 |
"provenance": [],
|
7 |
"machine_shape": "hm",
|
8 |
+
"authorship_tag": "ABX9TyN6S7kyJKrM5x0OOiN+CgTc",
|
9 |
"include_colab_link": true
|
10 |
},
|
11 |
"kernelspec": {
|
|
|
90 |
"cell_type": "code",
|
91 |
"source": [
|
92 |
"%%capture\n",
|
93 |
+
"!git clone https://github.com/sgoodfriend/rl-algo-impls.git"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
94 |
],
|
95 |
"metadata": {
|
96 |
"id": "k5ynTV25hdAf"
|
colab_train.ipynb
CHANGED
@@ -5,7 +5,7 @@
|
|
5 |
"colab": {
|
6 |
"provenance": [],
|
7 |
"machine_shape": "hm",
|
8 |
-
"authorship_tag": "
|
9 |
"include_colab_link": true
|
10 |
},
|
11 |
"kernelspec": {
|
@@ -75,7 +75,7 @@
|
|
75 |
"metadata": {
|
76 |
"id": "jKL_NFhVOjSc"
|
77 |
},
|
78 |
-
"execution_count":
|
79 |
"outputs": []
|
80 |
},
|
81 |
{
|
@@ -92,27 +92,12 @@
|
|
92 |
"cell_type": "code",
|
93 |
"source": [
|
94 |
"%%capture\n",
|
95 |
-
"!
|
96 |
-
"\n",
|
97 |
-
"with open(\"/root/.ssh/id_ed25519\", mode=\"w\") as f:\n",
|
98 |
-
" f.write(\"\"\"-----BEGIN OPENSSH PRIVATE KEY-----\n",
|
99 |
-
"b3BlbnNzaC1rZXktdjEAAAAABG5vbmUAAAAEbm9uZQAAAAAAAAABAAAAMwAAAAtzc2gtZW\n",
|
100 |
-
"QyNTUxOQAAACAkIepH6T90umhyp8+bkmSplqth1/+yxnu/Dax61KlSVAAAAKA4W3D3OFtw\n",
|
101 |
-
"9wAAAAtzc2gtZWQyNTUxOQAAACAkIepH6T90umhyp8+bkmSplqth1/+yxnu/Dax61KlSVA\n",
|
102 |
-
"AAAEA4SPGDm0/gofiOYXPTAi1Oxmw4mTppG2GdNgdMwMiDaSQh6kfpP3S6aHKnz5uSZKmW\n",
|
103 |
-
"q2HX/7LGe78NrHrUqVJUAAAAGmdvb2RmcmllbmQuc2NvdHRAZ21haWwuY29tAQID\n",
|
104 |
-
"-----END OPENSSH PRIVATE KEY-----\n",
|
105 |
-
"\"\"\"\n",
|
106 |
-
")\n",
|
107 |
-
"\n",
|
108 |
-
"!ssh-keyscan -t ed25519 github.com >> ~/.ssh/known_hosts\n",
|
109 |
-
"!chmod go-rwx /root/.ssh/id_ed25519\n",
|
110 |
-
"!git clone git@github.com:sgoodfriend/rl-algo-impls.git"
|
111 |
],
|
112 |
"metadata": {
|
113 |
"id": "k5ynTV25hdAf"
|
114 |
},
|
115 |
-
"execution_count":
|
116 |
"outputs": []
|
117 |
},
|
118 |
{
|
@@ -138,7 +123,7 @@
|
|
138 |
"metadata": {
|
139 |
"id": "nn6EETTc2Ewf"
|
140 |
},
|
141 |
-
"execution_count":
|
142 |
"outputs": []
|
143 |
},
|
144 |
{
|
@@ -151,7 +136,7 @@
|
|
151 |
"metadata": {
|
152 |
"id": "AfZh9rH3yQii"
|
153 |
},
|
154 |
-
"execution_count":
|
155 |
"outputs": []
|
156 |
},
|
157 |
{
|
@@ -196,7 +181,7 @@
|
|
196 |
"metadata": {
|
197 |
"id": "VzemeQJP2NO9"
|
198 |
},
|
199 |
-
"execution_count":
|
200 |
"outputs": []
|
201 |
},
|
202 |
{
|
|
|
5 |
"colab": {
|
6 |
"provenance": [],
|
7 |
"machine_shape": "hm",
|
8 |
+
"authorship_tag": "ABX9TyMmemQnx6G7GOnn6XBdjgxY",
|
9 |
"include_colab_link": true
|
10 |
},
|
11 |
"kernelspec": {
|
|
|
75 |
"metadata": {
|
76 |
"id": "jKL_NFhVOjSc"
|
77 |
},
|
78 |
+
"execution_count": null,
|
79 |
"outputs": []
|
80 |
},
|
81 |
{
|
|
|
92 |
"cell_type": "code",
|
93 |
"source": [
|
94 |
"%%capture\n",
|
95 |
+
"!git clone https://github.com/sgoodfriend/rl-algo-impls.git"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
96 |
],
|
97 |
"metadata": {
|
98 |
"id": "k5ynTV25hdAf"
|
99 |
},
|
100 |
+
"execution_count": null,
|
101 |
"outputs": []
|
102 |
},
|
103 |
{
|
|
|
123 |
"metadata": {
|
124 |
"id": "nn6EETTc2Ewf"
|
125 |
},
|
126 |
+
"execution_count": null,
|
127 |
"outputs": []
|
128 |
},
|
129 |
{
|
|
|
136 |
"metadata": {
|
137 |
"id": "AfZh9rH3yQii"
|
138 |
},
|
139 |
+
"execution_count": null,
|
140 |
"outputs": []
|
141 |
},
|
142 |
{
|
|
|
181 |
"metadata": {
|
182 |
"id": "VzemeQJP2NO9"
|
183 |
},
|
184 |
+
"execution_count": null,
|
185 |
"outputs": []
|
186 |
},
|
187 |
{
|
huggingface_publish.py
CHANGED
@@ -144,7 +144,7 @@ def publish(
|
|
144 |
api.create_repo(
|
145 |
token=huggingface_token,
|
146 |
repo_id=huggingface_repo,
|
147 |
-
private=
|
148 |
exist_ok=True,
|
149 |
)
|
150 |
repo_url = upload_folder(
|
|
|
144 |
api.create_repo(
|
145 |
token=huggingface_token,
|
146 |
repo_id=huggingface_repo,
|
147 |
+
private=False,
|
148 |
exist_ok=True,
|
149 |
)
|
150 |
repo_url = upload_folder(
|
replay.meta.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"content_type": "video/mp4", "encoder_version": {"backend": "ffmpeg", "version": "b'ffmpeg version 5.1.2 Copyright (c) 2000-2022 the FFmpeg developers\\nbuilt with clang version 14.0.6\\nconfiguration: --prefix=/Users/runner/miniforge3/conda-bld/ffmpeg_1671040513231/_h_env_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_pl --cc=arm64-apple-darwin20.0.0-clang --cxx=arm64-apple-darwin20.0.0-clang++ --nm=arm64-apple-darwin20.0.0-nm --ar=arm64-apple-darwin20.0.0-ar --disable-doc --disable-openssl --enable-demuxer=dash --enable-hardcoded-tables --enable-libfreetype --enable-libfontconfig --enable-libopenh264 --enable-cross-compile --arch=arm64 --target-os=darwin --cross-prefix=arm64-apple-darwin20.0.0- --host-cc=/Users/runner/miniforge3/conda-bld/ffmpeg_1671040513231/_build_env/bin/x86_64-apple-darwin13.4.0-clang --enable-neon --enable-gnutls --enable-libmp3lame --enable-libvpx --enable-pthreads --enable-gpl --enable-libx264 --enable-libx265 --enable-libaom --enable-libsvtav1 --enable-libxml2 --enable-pic --enable-shared --disable-static --enable-version3 --enable-zlib --pkg-config=/Users/runner/miniforge3/conda-bld/ffmpeg_1671040513231/_build_env/bin/pkg-config\\nlibavutil 57. 28.100 / 57. 28.100\\nlibavcodec 59. 37.100 / 59. 37.100\\nlibavformat 59. 27.100 / 59. 27.100\\nlibavdevice 59. 7.100 / 59. 7.100\\nlibavfilter 8. 44.100 / 8. 44.100\\nlibswscale 6. 7.100 / 6. 7.100\\nlibswresample 4. 7.100 / 4. 7.100\\nlibpostproc 56. 6.100 / 56. 6.100\\n'", "cmdline": ["ffmpeg", "-nostats", "-loglevel", "error", "-y", "-f", "rawvideo", "-s:v", "500x500", "-pix_fmt", "rgb24", "-framerate", "30", "-i", "-", "-vf", "scale=trunc(iw/2)*2:trunc(ih/2)*2", "-vcodec", "libx264", "-pix_fmt", "yuv420p", "-r", "30", "/var/folders/9g/my5557_91xddp6lx00nkzly80000gn/T/
|
|
|
1 |
+
{"content_type": "video/mp4", "encoder_version": {"backend": "ffmpeg", "version": "b'ffmpeg version 5.1.2 Copyright (c) 2000-2022 the FFmpeg developers\\nbuilt with clang version 14.0.6\\nconfiguration: --prefix=/Users/runner/miniforge3/conda-bld/ffmpeg_1671040513231/_h_env_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_pl --cc=arm64-apple-darwin20.0.0-clang --cxx=arm64-apple-darwin20.0.0-clang++ --nm=arm64-apple-darwin20.0.0-nm --ar=arm64-apple-darwin20.0.0-ar --disable-doc --disable-openssl --enable-demuxer=dash --enable-hardcoded-tables --enable-libfreetype --enable-libfontconfig --enable-libopenh264 --enable-cross-compile --arch=arm64 --target-os=darwin --cross-prefix=arm64-apple-darwin20.0.0- --host-cc=/Users/runner/miniforge3/conda-bld/ffmpeg_1671040513231/_build_env/bin/x86_64-apple-darwin13.4.0-clang --enable-neon --enable-gnutls --enable-libmp3lame --enable-libvpx --enable-pthreads --enable-gpl --enable-libx264 --enable-libx265 --enable-libaom --enable-libsvtav1 --enable-libxml2 --enable-pic --enable-shared --disable-static --enable-version3 --enable-zlib --pkg-config=/Users/runner/miniforge3/conda-bld/ffmpeg_1671040513231/_build_env/bin/pkg-config\\nlibavutil 57. 28.100 / 57. 28.100\\nlibavcodec 59. 37.100 / 59. 37.100\\nlibavformat 59. 27.100 / 59. 27.100\\nlibavdevice 59. 7.100 / 59. 7.100\\nlibavfilter 8. 44.100 / 8. 44.100\\nlibswscale 6. 7.100 / 6. 7.100\\nlibswresample 4. 7.100 / 4. 7.100\\nlibpostproc 56. 6.100 / 56. 6.100\\n'", "cmdline": ["ffmpeg", "-nostats", "-loglevel", "error", "-y", "-f", "rawvideo", "-s:v", "500x500", "-pix_fmt", "rgb24", "-framerate", "30", "-i", "-", "-vf", "scale=trunc(iw/2)*2:trunc(ih/2)*2", "-vcodec", "libx264", "-pix_fmt", "yuv420p", "-r", "30", "/var/folders/9g/my5557_91xddp6lx00nkzly80000gn/T/tmpa694w53n/ppo-Acrobot-v1/replay.mp4"]}, "episode": {"r": -73.0, "l": 74, "t": 1.308829}}
|