sgoodfriend committed on
Commit
41e80f6
1 Parent(s): 69aa193

PPO playing Acrobot-v1 from https://github.com/sgoodfriend/rl-algo-impls/tree/5598ebc4b03054f16eebe76792486ba7bcacfc5c

Browse files
benchmarks/colab_benchmark.ipynb CHANGED
@@ -5,7 +5,7 @@
5
  "colab": {
6
  "provenance": [],
7
  "machine_shape": "hm",
8
- "authorship_tag": "ABX9TyMJFprw7XNl/BqbKAHd/483",
9
  "include_colab_link": true
10
  },
11
  "kernelspec": {
@@ -70,22 +70,7 @@
70
  "cell_type": "code",
71
  "source": [
72
  "%%capture\n",
73
- "!mkdir -p ~/.ssh\n",
74
- "\n",
75
- "with open(\"/root/.ssh/id_ed25519\", mode=\"w\") as f:\n",
76
- " f.write(\"\"\"-----BEGIN OPENSSH PRIVATE KEY-----\n",
77
- "b3BlbnNzaC1rZXktdjEAAAAABG5vbmUAAAAEbm9uZQAAAAAAAAABAAAAMwAAAAtzc2gtZW\n",
78
- "QyNTUxOQAAACAkIepH6T90umhyp8+bkmSplqth1/+yxnu/Dax61KlSVAAAAKA4W3D3OFtw\n",
79
- "9wAAAAtzc2gtZWQyNTUxOQAAACAkIepH6T90umhyp8+bkmSplqth1/+yxnu/Dax61KlSVA\n",
80
- "AAAEA4SPGDm0/gofiOYXPTAi1Oxmw4mTppG2GdNgdMwMiDaSQh6kfpP3S6aHKnz5uSZKmW\n",
81
- "q2HX/7LGe78NrHrUqVJUAAAAGmdvb2RmcmllbmQuc2NvdHRAZ21haWwuY29tAQID\n",
82
- "-----END OPENSSH PRIVATE KEY-----\n",
83
- "\"\"\"\n",
84
- ")\n",
85
- "\n",
86
- "!ssh-keyscan -t ed25519 github.com >> ~/.ssh/known_hosts\n",
87
- "!chmod go-rwx /root/.ssh/id_ed25519\n",
88
- "!git clone git@github.com:sgoodfriend/rl-algo-impls.git"
89
  ],
90
  "metadata": {
91
  "id": "k5ynTV25hdAf"
 
5
  "colab": {
6
  "provenance": [],
7
  "machine_shape": "hm",
8
+ "authorship_tag": "ABX9TyOGIH7rqgasim3Sz7b1rpoE",
9
  "include_colab_link": true
10
  },
11
  "kernelspec": {
 
70
  "cell_type": "code",
71
  "source": [
72
  "%%capture\n",
73
+ "!git clone https://github.com/sgoodfriend/rl-algo-impls.git"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
74
  ],
75
  "metadata": {
76
  "id": "k5ynTV25hdAf"
colab_enjoy.ipynb CHANGED
@@ -5,7 +5,7 @@
5
  "colab": {
6
  "provenance": [],
7
  "machine_shape": "hm",
8
- "authorship_tag": "ABX9TyM1iRYRLhijbxWxPLk9Ba7f",
9
  "include_colab_link": true
10
  },
11
  "kernelspec": {
@@ -90,22 +90,7 @@
90
  "cell_type": "code",
91
  "source": [
92
  "%%capture\n",
93
- "!mkdir -p ~/.ssh\n",
94
- "\n",
95
- "with open(\"/root/.ssh/id_ed25519\", mode=\"w\") as f:\n",
96
- " f.write(\"\"\"-----BEGIN OPENSSH PRIVATE KEY-----\n",
97
- "b3BlbnNzaC1rZXktdjEAAAAABG5vbmUAAAAEbm9uZQAAAAAAAAABAAAAMwAAAAtzc2gtZW\n",
98
- "QyNTUxOQAAACAkIepH6T90umhyp8+bkmSplqth1/+yxnu/Dax61KlSVAAAAKA4W3D3OFtw\n",
99
- "9wAAAAtzc2gtZWQyNTUxOQAAACAkIepH6T90umhyp8+bkmSplqth1/+yxnu/Dax61KlSVA\n",
100
- "AAAEA4SPGDm0/gofiOYXPTAi1Oxmw4mTppG2GdNgdMwMiDaSQh6kfpP3S6aHKnz5uSZKmW\n",
101
- "q2HX/7LGe78NrHrUqVJUAAAAGmdvb2RmcmllbmQuc2NvdHRAZ21haWwuY29tAQID\n",
102
- "-----END OPENSSH PRIVATE KEY-----\n",
103
- "\"\"\"\n",
104
- ")\n",
105
- "\n",
106
- "!ssh-keyscan -t ed25519 github.com >> ~/.ssh/known_hosts\n",
107
- "!chmod go-rwx /root/.ssh/id_ed25519\n",
108
- "!git clone git@github.com:sgoodfriend/rl-algo-impls.git"
109
  ],
110
  "metadata": {
111
  "id": "k5ynTV25hdAf"
 
5
  "colab": {
6
  "provenance": [],
7
  "machine_shape": "hm",
8
+ "authorship_tag": "ABX9TyN6S7kyJKrM5x0OOiN+CgTc",
9
  "include_colab_link": true
10
  },
11
  "kernelspec": {
 
90
  "cell_type": "code",
91
  "source": [
92
  "%%capture\n",
93
+ "!git clone https://github.com/sgoodfriend/rl-algo-impls.git"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
94
  ],
95
  "metadata": {
96
  "id": "k5ynTV25hdAf"
colab_train.ipynb CHANGED
@@ -5,7 +5,7 @@
5
  "colab": {
6
  "provenance": [],
7
  "machine_shape": "hm",
8
- "authorship_tag": "ABX9TyNGs5TudweZiYKySQxg6H+K",
9
  "include_colab_link": true
10
  },
11
  "kernelspec": {
@@ -75,7 +75,7 @@
75
  "metadata": {
76
  "id": "jKL_NFhVOjSc"
77
  },
78
- "execution_count": 2,
79
  "outputs": []
80
  },
81
  {
@@ -92,27 +92,12 @@
92
  "cell_type": "code",
93
  "source": [
94
  "%%capture\n",
95
- "!mkdir -p ~/.ssh\n",
96
- "\n",
97
- "with open(\"/root/.ssh/id_ed25519\", mode=\"w\") as f:\n",
98
- " f.write(\"\"\"-----BEGIN OPENSSH PRIVATE KEY-----\n",
99
- "b3BlbnNzaC1rZXktdjEAAAAABG5vbmUAAAAEbm9uZQAAAAAAAAABAAAAMwAAAAtzc2gtZW\n",
100
- "QyNTUxOQAAACAkIepH6T90umhyp8+bkmSplqth1/+yxnu/Dax61KlSVAAAAKA4W3D3OFtw\n",
101
- "9wAAAAtzc2gtZWQyNTUxOQAAACAkIepH6T90umhyp8+bkmSplqth1/+yxnu/Dax61KlSVA\n",
102
- "AAAEA4SPGDm0/gofiOYXPTAi1Oxmw4mTppG2GdNgdMwMiDaSQh6kfpP3S6aHKnz5uSZKmW\n",
103
- "q2HX/7LGe78NrHrUqVJUAAAAGmdvb2RmcmllbmQuc2NvdHRAZ21haWwuY29tAQID\n",
104
- "-----END OPENSSH PRIVATE KEY-----\n",
105
- "\"\"\"\n",
106
- ")\n",
107
- "\n",
108
- "!ssh-keyscan -t ed25519 github.com >> ~/.ssh/known_hosts\n",
109
- "!chmod go-rwx /root/.ssh/id_ed25519\n",
110
- "!git clone git@github.com:sgoodfriend/rl-algo-impls.git"
111
  ],
112
  "metadata": {
113
  "id": "k5ynTV25hdAf"
114
  },
115
- "execution_count": 3,
116
  "outputs": []
117
  },
118
  {
@@ -138,7 +123,7 @@
138
  "metadata": {
139
  "id": "nn6EETTc2Ewf"
140
  },
141
- "execution_count": 4,
142
  "outputs": []
143
  },
144
  {
@@ -151,7 +136,7 @@
151
  "metadata": {
152
  "id": "AfZh9rH3yQii"
153
  },
154
- "execution_count": 5,
155
  "outputs": []
156
  },
157
  {
@@ -196,7 +181,7 @@
196
  "metadata": {
197
  "id": "VzemeQJP2NO9"
198
  },
199
- "execution_count": 7,
200
  "outputs": []
201
  },
202
  {
 
5
  "colab": {
6
  "provenance": [],
7
  "machine_shape": "hm",
8
+ "authorship_tag": "ABX9TyMmemQnx6G7GOnn6XBdjgxY",
9
  "include_colab_link": true
10
  },
11
  "kernelspec": {
 
75
  "metadata": {
76
  "id": "jKL_NFhVOjSc"
77
  },
78
+ "execution_count": null,
79
  "outputs": []
80
  },
81
  {
 
92
  "cell_type": "code",
93
  "source": [
94
  "%%capture\n",
95
+ "!git clone https://github.com/sgoodfriend/rl-algo-impls.git"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
96
  ],
97
  "metadata": {
98
  "id": "k5ynTV25hdAf"
99
  },
100
+ "execution_count": null,
101
  "outputs": []
102
  },
103
  {
 
123
  "metadata": {
124
  "id": "nn6EETTc2Ewf"
125
  },
126
+ "execution_count": null,
127
  "outputs": []
128
  },
129
  {
 
136
  "metadata": {
137
  "id": "AfZh9rH3yQii"
138
  },
139
+ "execution_count": null,
140
  "outputs": []
141
  },
142
  {
 
181
  "metadata": {
182
  "id": "VzemeQJP2NO9"
183
  },
184
+ "execution_count": null,
185
  "outputs": []
186
  },
187
  {
huggingface_publish.py CHANGED
@@ -144,7 +144,7 @@ def publish(
144
  api.create_repo(
145
  token=huggingface_token,
146
  repo_id=huggingface_repo,
147
- private=True,
148
  exist_ok=True,
149
  )
150
  repo_url = upload_folder(
 
144
  api.create_repo(
145
  token=huggingface_token,
146
  repo_id=huggingface_repo,
147
+ private=False,
148
  exist_ok=True,
149
  )
150
  repo_url = upload_folder(
replay.meta.json CHANGED
@@ -1 +1 @@
1
- {"content_type": "video/mp4", "encoder_version": {"backend": "ffmpeg", "version": "b'ffmpeg version 5.1.2 Copyright (c) 2000-2022 the FFmpeg developers\\nbuilt with clang version 14.0.6\\nconfiguration: --prefix=/Users/runner/miniforge3/conda-bld/ffmpeg_1671040513231/_h_env_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_pl --cc=arm64-apple-darwin20.0.0-clang --cxx=arm64-apple-darwin20.0.0-clang++ --nm=arm64-apple-darwin20.0.0-nm --ar=arm64-apple-darwin20.0.0-ar --disable-doc --disable-openssl --enable-demuxer=dash --enable-hardcoded-tables --enable-libfreetype --enable-libfontconfig --enable-libopenh264 --enable-cross-compile --arch=arm64 --target-os=darwin --cross-prefix=arm64-apple-darwin20.0.0- --host-cc=/Users/runner/miniforge3/conda-bld/ffmpeg_1671040513231/_build_env/bin/x86_64-apple-darwin13.4.0-clang --enable-neon --enable-gnutls --enable-libmp3lame --enable-libvpx --enable-pthreads --enable-gpl --enable-libx264 --enable-libx265 --enable-libaom --enable-libsvtav1 --enable-libxml2 --enable-pic --enable-shared --disable-static --enable-version3 --enable-zlib --pkg-config=/Users/runner/miniforge3/conda-bld/ffmpeg_1671040513231/_build_env/bin/pkg-config\\nlibavutil 57. 28.100 / 57. 28.100\\nlibavcodec 59. 37.100 / 59. 37.100\\nlibavformat 59. 27.100 / 59. 27.100\\nlibavdevice 59. 7.100 / 59. 7.100\\nlibavfilter 8. 44.100 / 8. 44.100\\nlibswscale 6. 7.100 / 6. 7.100\\nlibswresample 4. 7.100 / 4. 7.100\\nlibpostproc 56. 6.100 / 56. 
6.100\\n'", "cmdline": ["ffmpeg", "-nostats", "-loglevel", "error", "-y", "-f", "rawvideo", "-s:v", "500x500", "-pix_fmt", "rgb24", "-framerate", "30", "-i", "-", "-vf", "scale=trunc(iw/2)*2:trunc(ih/2)*2", "-vcodec", "libx264", "-pix_fmt", "yuv420p", "-r", "30", "/var/folders/9g/my5557_91xddp6lx00nkzly80000gn/T/tmptj2x08p5/ppo-Acrobot-v1/replay.mp4"]}, "episode": {"r": -73.0, "l": 74, "t": 1.413602}}
 
1
+ {"content_type": "video/mp4", "encoder_version": {"backend": "ffmpeg", "version": "b'ffmpeg version 5.1.2 Copyright (c) 2000-2022 the FFmpeg developers\\nbuilt with clang version 14.0.6\\nconfiguration: --prefix=/Users/runner/miniforge3/conda-bld/ffmpeg_1671040513231/_h_env_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_placehold_pl --cc=arm64-apple-darwin20.0.0-clang --cxx=arm64-apple-darwin20.0.0-clang++ --nm=arm64-apple-darwin20.0.0-nm --ar=arm64-apple-darwin20.0.0-ar --disable-doc --disable-openssl --enable-demuxer=dash --enable-hardcoded-tables --enable-libfreetype --enable-libfontconfig --enable-libopenh264 --enable-cross-compile --arch=arm64 --target-os=darwin --cross-prefix=arm64-apple-darwin20.0.0- --host-cc=/Users/runner/miniforge3/conda-bld/ffmpeg_1671040513231/_build_env/bin/x86_64-apple-darwin13.4.0-clang --enable-neon --enable-gnutls --enable-libmp3lame --enable-libvpx --enable-pthreads --enable-gpl --enable-libx264 --enable-libx265 --enable-libaom --enable-libsvtav1 --enable-libxml2 --enable-pic --enable-shared --disable-static --enable-version3 --enable-zlib --pkg-config=/Users/runner/miniforge3/conda-bld/ffmpeg_1671040513231/_build_env/bin/pkg-config\\nlibavutil 57. 28.100 / 57. 28.100\\nlibavcodec 59. 37.100 / 59. 37.100\\nlibavformat 59. 27.100 / 59. 27.100\\nlibavdevice 59. 7.100 / 59. 7.100\\nlibavfilter 8. 44.100 / 8. 44.100\\nlibswscale 6. 7.100 / 6. 7.100\\nlibswresample 4. 7.100 / 4. 7.100\\nlibpostproc 56. 6.100 / 56. 
6.100\\n'", "cmdline": ["ffmpeg", "-nostats", "-loglevel", "error", "-y", "-f", "rawvideo", "-s:v", "500x500", "-pix_fmt", "rgb24", "-framerate", "30", "-i", "-", "-vf", "scale=trunc(iw/2)*2:trunc(ih/2)*2", "-vcodec", "libx264", "-pix_fmt", "yuv420p", "-r", "30", "/var/folders/9g/my5557_91xddp6lx00nkzly80000gn/T/tmpa694w53n/ppo-Acrobot-v1/replay.mp4"]}, "episode": {"r": -73.0, "l": 74, "t": 1.308829}}