gagan3012 commited on
Commit
80c4790
1 Parent(s): 9be8301

Create t5s.ipynb

Browse files
Files changed (1) hide show
  1. notebooks/t5s.ipynb +823 -0
notebooks/t5s.ipynb ADDED
@@ -0,0 +1,823 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "nbformat": 4,
3
+ "nbformat_minor": 0,
4
+ "metadata": {
5
+ "colab": {
6
+ "name": "t5s.ipynb",
7
+ "provenance": []
8
+ },
9
+ "kernelspec": {
10
+ "name": "python3",
11
+ "display_name": "Python 3"
12
+ },
13
+ "language_info": {
14
+ "name": "python"
15
+ }
16
+ },
17
+ "cells": [
18
+ {
19
+ "cell_type": "code",
20
+ "metadata": {
21
+ "colab": {
22
+ "base_uri": "https://localhost:8080/",
23
+ "height": 1000
24
+ },
25
+ "id": "J5FugqkVrf-P",
26
+ "outputId": "4082375a-33c4-448f-a618-613224ae02f8"
27
+ },
28
+ "source": [
29
+ "!pip install t5s --upgrade"
30
+ ],
31
+ "execution_count": 1,
32
+ "outputs": [
33
+ {
34
+ "output_type": "stream",
35
+ "text": [
36
+ "Collecting t5s\n",
37
+ " Downloading t5s-1.0.4-py3-none-any.whl (17 kB)\n",
38
+ "Collecting pytorch-lightning==1.3.5\n",
39
+ " Downloading pytorch_lightning-1.3.5-py3-none-any.whl (808 kB)\n",
40
+ "\u001b[K |████████████████████████████████| 808 kB 8.2 MB/s \n",
41
+ "\u001b[?25hCollecting dagshub==0.1.7\n",
42
+ " Downloading dagshub-0.1.7-py3-none-any.whl (9.6 kB)\n",
43
+ "Collecting streamlit==0.85.1\n",
44
+ " Downloading streamlit-0.85.1-py2.py3-none-any.whl (7.9 MB)\n",
45
+ "\u001b[K |████████████████████████████████| 7.9 MB 53.0 MB/s \n",
46
+ "\u001b[?25hRequirement already satisfied: click in /usr/local/lib/python3.7/dist-packages (from t5s) (7.1.2)\n",
47
+ "Requirement already satisfied: coverage in /usr/local/lib/python3.7/dist-packages (from t5s) (3.7.1)\n",
48
+ "Collecting numpy==1.19.2\n",
49
+ " Downloading numpy-1.19.2-cp37-cp37m-manylinux2010_x86_64.whl (14.5 MB)\n",
50
+ "\u001b[K |████████████████████████████████| 14.5 MB 28 kB/s \n",
51
+ "\u001b[?25hRequirement already satisfied: pyyaml in /usr/local/lib/python3.7/dist-packages (from t5s) (3.13)\n",
52
+ "Collecting awscli\n",
53
+ " Downloading awscli-1.20.18-py3-none-any.whl (3.7 MB)\n",
54
+ "\u001b[K |████████████████████████████████| 3.7 MB 53.2 MB/s \n",
55
+ "\u001b[?25hRequirement already satisfied: pandas==1.1.5 in /usr/local/lib/python3.7/dist-packages (from t5s) (1.1.5)\n",
56
+ "Requirement already satisfied: torch==1.9.0 in /usr/local/lib/python3.7/dist-packages (from t5s) (1.9.0+cu102)\n",
57
+ "Collecting transformers==4.9.0\n",
58
+ " Downloading transformers-4.9.0-py3-none-any.whl (2.6 MB)\n",
59
+ "\u001b[K |████████████████████████████████| 2.6 MB 49.8 MB/s \n",
60
+ "\u001b[?25hCollecting flake8\n",
61
+ " Downloading flake8-3.9.2-py2.py3-none-any.whl (73 kB)\n",
62
+ "\u001b[K |████████████████████████████████| 73 kB 2.2 MB/s \n",
63
+ "\u001b[?25hCollecting datasets==1.10.2\n",
64
+ " Downloading datasets-1.10.2-py3-none-any.whl (542 kB)\n",
65
+ "\u001b[K |████████████████████████████████| 542 kB 50.5 MB/s \n",
66
+ "\u001b[?25hCollecting dvc==2.5.4\n",
67
+ " Downloading dvc-2.5.4-py3-none-any.whl (638 kB)\n",
68
+ "\u001b[K |████████████████████████████████| 638 kB 67.4 MB/s \n",
69
+ "\u001b[?25hCollecting black\n",
70
+ " Downloading black-21.7b0-py3-none-any.whl (141 kB)\n",
71
+ "\u001b[K |████████████████████████████████| 141 kB 92.8 MB/s \n",
72
+ "\u001b[?25hCollecting mlflow==1.19.0\n",
73
+ " Downloading mlflow-1.19.0-py3-none-any.whl (14.4 MB)\n",
74
+ "\u001b[K |████████████████████████████████| 14.4 MB 63 kB/s \n",
75
+ "\u001b[?25hCollecting rouge-score==0.0.4\n",
76
+ " Downloading rouge_score-0.0.4-py2.py3-none-any.whl (22 kB)\n",
77
+ "Collecting python-dotenv>=0.5.1\n",
78
+ " Downloading python_dotenv-0.19.0-py2.py3-none-any.whl (17 kB)\n",
79
+ "Collecting pyyaml\n",
80
+ " Downloading PyYAML-5.4.1-cp37-cp37m-manylinux1_x86_64.whl (636 kB)\n",
81
+ "\u001b[K |████████████████████████████████| 636 kB 71.8 MB/s \n",
82
+ "\u001b[?25hRequirement already satisfied: importlib-metadata in /usr/local/lib/python3.7/dist-packages (from datasets==1.10.2->t5s) (4.6.1)\n",
83
+ "Requirement already satisfied: packaging in /usr/local/lib/python3.7/dist-packages (from datasets==1.10.2->t5s) (21.0)\n",
84
+ "Requirement already satisfied: requests>=2.19.0 in /usr/local/lib/python3.7/dist-packages (from datasets==1.10.2->t5s) (2.23.0)\n",
85
+ "Requirement already satisfied: pyarrow!=4.0.0,>=1.0.0 in /usr/local/lib/python3.7/dist-packages (from datasets==1.10.2->t5s) (3.0.0)\n",
86
+ "Requirement already satisfied: dill in /usr/local/lib/python3.7/dist-packages (from datasets==1.10.2->t5s) (0.3.4)\n",
87
+ "Collecting huggingface-hub<0.1.0\n",
88
+ " Downloading huggingface_hub-0.0.15-py3-none-any.whl (43 kB)\n",
89
+ "\u001b[K |████████████████████████████████| 43 kB 2.6 MB/s \n",
90
+ "\u001b[?25hCollecting xxhash\n",
91
+ " Downloading xxhash-2.0.2-cp37-cp37m-manylinux2010_x86_64.whl (243 kB)\n",
92
+ "\u001b[K |████████████████████████████████| 243 kB 73.4 MB/s \n",
93
+ "\u001b[?25hRequirement already satisfied: multiprocess in /usr/local/lib/python3.7/dist-packages (from datasets==1.10.2->t5s) (0.70.12.2)\n",
94
+ "Collecting tqdm>=4.42\n",
95
+ " Downloading tqdm-4.62.0-py2.py3-none-any.whl (76 kB)\n",
96
+ "\u001b[K |████████████████████████████████| 76 kB 6.1 MB/s \n",
97
+ "\u001b[?25hCollecting fsspec>=2021.05.0\n",
98
+ " Downloading fsspec-2021.7.0-py3-none-any.whl (118 kB)\n",
99
+ "\u001b[K |████████████████████████████████| 118 kB 73.9 MB/s \n",
100
+ "\u001b[?25hCollecting dictdiffer>=0.8.1\n",
101
+ " Downloading dictdiffer-0.9.0-py2.py3-none-any.whl (16 kB)\n",
102
+ "Collecting python-benedict>=0.21.1\n",
103
+ " Downloading python_benedict-0.24.1-py3-none-any.whl (40 kB)\n",
104
+ "\u001b[K |████████████████████████████████| 40 kB 7.1 MB/s \n",
105
+ "\u001b[?25hCollecting dulwich>=0.20.23\n",
106
+ " Downloading dulwich-0.20.24-cp37-cp37m-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_12_x86_64.manylinux2010_x86_64.whl (529 kB)\n",
107
+ "\u001b[K |████████████████████████████████| 529 kB 84.6 MB/s \n",
108
+ "\u001b[?25hRequirement already satisfied: appdirs>=1.4.3 in /usr/local/lib/python3.7/dist-packages (from dvc==2.5.4->t5s) (1.4.4)\n",
109
+ "Collecting configobj>=5.0.6\n",
110
+ " Downloading configobj-5.0.6.tar.gz (33 kB)\n",
111
+ "Collecting psutil>=5.8.0\n",
112
+ " Downloading psutil-5.8.0-cp37-cp37m-manylinux2010_x86_64.whl (296 kB)\n",
113
+ "\u001b[K |████████████████████████████████| 296 kB 83.8 MB/s \n",
114
+ "\u001b[?25hRequirement already satisfied: typing-extensions>=3.7.4 in /usr/local/lib/python3.7/dist-packages (from dvc==2.5.4->t5s) (3.7.4.3)\n",
115
+ "Requirement already satisfied: pydot>=1.2.4 in /usr/local/lib/python3.7/dist-packages (from dvc==2.5.4->t5s) (1.3.0)\n",
116
+ "Requirement already satisfied: setuptools>=34.0.0 in /usr/local/lib/python3.7/dist-packages (from dvc==2.5.4->t5s) (57.2.0)\n",
117
+ "Collecting flatten-dict<1,>=0.3.0\n",
118
+ " Downloading flatten_dict-0.4.2-py2.py3-none-any.whl (9.7 kB)\n",
119
+ "Collecting pygit2>=1.5.0\n",
120
+ " Downloading pygit2-1.6.1-cp37-cp37m-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (4.6 MB)\n",
121
+ "\u001b[K |████████████████████████████████| 4.6 MB 81.3 MB/s \n",
122
+ "\u001b[?25hCollecting pathspec>=0.6.0\n",
123
+ " Downloading pathspec-0.9.0-py2.py3-none-any.whl (31 kB)\n",
124
+ "Collecting shtab<2,>=1.3.4\n",
125
+ " Downloading shtab-1.3.10-py2.py3-none-any.whl (13 kB)\n",
126
+ "Collecting dpath<3,>=2.0.1\n",
127
+ " Downloading dpath-2.0.1.tar.gz (21 kB)\n",
128
+ "Collecting grandalf==0.6\n",
129
+ " Downloading grandalf-0.6-py3-none-any.whl (31 kB)\n",
130
+ "Requirement already satisfied: networkx~=2.5 in /usr/local/lib/python3.7/dist-packages (from dvc==2.5.4->t5s) (2.5.1)\n",
131
+ "Collecting ply>=3.9\n",
132
+ " Downloading ply-3.11-py2.py3-none-any.whl (49 kB)\n",
133
+ "\u001b[K |████████████████████████████████| 49 kB 8.2 MB/s \n",
134
+ "\u001b[?25hCollecting voluptuous>=0.11.7\n",
135
+ " Downloading voluptuous-0.12.1-py3-none-any.whl (29 kB)\n",
136
+ "Collecting ruamel.yaml>=0.16.1\n",
137
+ " Downloading ruamel.yaml-0.17.10-py3-none-any.whl (108 kB)\n",
138
+ "\u001b[K |████████████████████████████████| 108 kB 79.0 MB/s \n",
139
+ "\u001b[?25hCollecting zc.lockfile>=1.2.1\n",
140
+ " Downloading zc.lockfile-2.0-py2.py3-none-any.whl (9.7 kB)\n",
141
+ "Collecting nanotime>=0.5.2\n",
142
+ " Downloading nanotime-0.5.2.tar.gz (3.2 kB)\n",
143
+ "Collecting funcy>=1.14\n",
144
+ " Downloading funcy-1.16-py2.py3-none-any.whl (32 kB)\n",
145
+ "Collecting pygtrie>=2.3.2\n",
146
+ " Downloading pygtrie-2.4.2.tar.gz (35 kB)\n",
147
+ "Collecting gitpython>3\n",
148
+ " Downloading GitPython-3.1.18-py3-none-any.whl (170 kB)\n",
149
+ "\u001b[K |████████████████████████████████| 170 kB 70.9 MB/s \n",
150
+ "\u001b[?25hRequirement already satisfied: tabulate>=0.8.7 in /usr/local/lib/python3.7/dist-packages (from dvc==2.5.4->t5s) (0.8.9)\n",
151
+ "Requirement already satisfied: toml>=0.10.1 in /usr/local/lib/python3.7/dist-packages (from dvc==2.5.4->t5s) (0.10.2)\n",
152
+ "Requirement already satisfied: pyparsing==2.4.7 in /usr/local/lib/python3.7/dist-packages (from dvc==2.5.4->t5s) (2.4.7)\n",
153
+ "Collecting jsonpath-ng>=1.5.1\n",
154
+ " Downloading jsonpath_ng-1.5.3-py3-none-any.whl (29 kB)\n",
155
+ "Requirement already satisfied: pyasn1>=0.4.1 in /usr/local/lib/python3.7/dist-packages (from dvc==2.5.4->t5s) (0.4.8)\n",
156
+ "Collecting diskcache>=5.2.1\n",
157
+ " Downloading diskcache-5.2.1-py3-none-any.whl (44 kB)\n",
158
+ "\u001b[K |████████████████████████████████| 44 kB 3.5 MB/s \n",
159
+ "\u001b[?25hCollecting flufl.lock<4,>=3.2\n",
160
+ " Downloading flufl.lock-3.2.tar.gz (19 kB)\n",
161
+ "Collecting shortuuid>=0.5.0\n",
162
+ " Downloading shortuuid-1.0.1-py3-none-any.whl (7.5 kB)\n",
163
+ "Collecting colorama>=0.3.9\n",
164
+ " Downloading colorama-0.4.4-py2.py3-none-any.whl (16 kB)\n",
165
+ "Collecting rich>=10.0.0\n",
166
+ " Downloading rich-10.7.0-py3-none-any.whl (209 kB)\n",
167
+ "\u001b[K |████████████████████████████████| 209 kB 67.7 MB/s \n",
168
+ "\u001b[?25hCollecting distro>=1.3.0\n",
169
+ " Downloading distro-1.6.0-py2.py3-none-any.whl (19 kB)\n",
170
+ "Requirement already satisfied: future in /usr/local/lib/python3.7/dist-packages (from grandalf==0.6->dvc==2.5.4->t5s) (0.16.0)\n",
171
+ "Collecting databricks-cli>=0.8.7\n",
172
+ " Downloading databricks-cli-0.15.0.tar.gz (56 kB)\n",
173
+ "\u001b[K |████████████████████████████████| 56 kB 5.8 MB/s \n",
174
+ "\u001b[?25hCollecting docker>=4.0.0\n",
175
+ " Downloading docker-5.0.0-py2.py3-none-any.whl (146 kB)\n",
176
+ "\u001b[K |████████████████████████████████| 146 kB 81.5 MB/s \n",
177
+ "\u001b[?25hCollecting prometheus-flask-exporter\n",
178
+ " Downloading prometheus_flask_exporter-0.18.2.tar.gz (22 kB)\n",
179
+ "Requirement already satisfied: Flask in /usr/local/lib/python3.7/dist-packages (from mlflow==1.19.0->t5s) (1.1.4)\n",
180
+ "Collecting querystring-parser\n",
181
+ " Downloading querystring_parser-1.2.4-py2.py3-none-any.whl (7.9 kB)\n",
182
+ "Requirement already satisfied: sqlalchemy in /usr/local/lib/python3.7/dist-packages (from mlflow==1.19.0->t5s) (1.4.20)\n",
183
+ "Requirement already satisfied: pytz in /usr/local/lib/python3.7/dist-packages (from mlflow==1.19.0->t5s) (2018.9)\n",
184
+ "Requirement already satisfied: protobuf>=3.7.0 in /usr/local/lib/python3.7/dist-packages (from mlflow==1.19.0->t5s) (3.17.3)\n",
185
+ "Requirement already satisfied: cloudpickle in /usr/local/lib/python3.7/dist-packages (from mlflow==1.19.0->t5s) (1.3.0)\n",
186
+ "Requirement already satisfied: entrypoints in /usr/local/lib/python3.7/dist-packages (from mlflow==1.19.0->t5s) (0.3)\n",
187
+ "Collecting alembic<=1.4.1\n",
188
+ " Downloading alembic-1.4.1.tar.gz (1.1 MB)\n",
189
+ "\u001b[K |████████████████████████████████| 1.1 MB 77.7 MB/s \n",
190
+ "\u001b[?25hCollecting gunicorn\n",
191
+ " Downloading gunicorn-20.1.0-py3-none-any.whl (79 kB)\n",
192
+ "\u001b[K |████████████████████████████████| 79 kB 10.9 MB/s \n",
193
+ "\u001b[?25hRequirement already satisfied: sqlparse>=0.3.1 in /usr/local/lib/python3.7/dist-packages (from mlflow==1.19.0->t5s) (0.4.1)\n",
194
+ "Requirement already satisfied: python-dateutil>=2.7.3 in /usr/local/lib/python3.7/dist-packages (from pandas==1.1.5->t5s) (2.8.1)\n",
195
+ "Collecting torchmetrics>=0.2.0\n",
196
+ " Downloading torchmetrics-0.5.0-py3-none-any.whl (272 kB)\n",
197
+ "\u001b[K |████████████████████████████████| 272 kB 67.2 MB/s \n",
198
+ "\u001b[?25hCollecting future\n",
199
+ " Downloading future-0.18.2.tar.gz (829 kB)\n",
200
+ "\u001b[K |████████████████████████████████| 829 kB 58.5 MB/s \n",
201
+ "\u001b[?25hCollecting tensorboard!=2.5.0,>=2.2.0\n",
202
+ " Downloading tensorboard-2.6.0-py3-none-any.whl (5.6 MB)\n",
203
+ "\u001b[K |████████████████████████████████| 5.6 MB 63.6 MB/s \n",
204
+ "\u001b[?25hCollecting pyDeprecate==0.3.0\n",
205
+ " Downloading pyDeprecate-0.3.0-py3-none-any.whl (10 kB)\n",
206
+ "Requirement already satisfied: absl-py in /usr/local/lib/python3.7/dist-packages (from rouge-score==0.0.4->t5s) (0.12.0)\n",
207
+ "Requirement already satisfied: six>=1.14.0 in /usr/local/lib/python3.7/dist-packages (from rouge-score==0.0.4->t5s) (1.15.0)\n",
208
+ "Requirement already satisfied: nltk in /usr/local/lib/python3.7/dist-packages (from rouge-score==0.0.4->t5s) (3.2.5)\n",
209
+ "Requirement already satisfied: altair>=3.2.0 in /usr/local/lib/python3.7/dist-packages (from streamlit==0.85.1->t5s) (4.1.0)\n",
210
+ "Requirement already satisfied: attrs in /usr/local/lib/python3.7/dist-packages (from streamlit==0.85.1->t5s) (21.2.0)\n",
211
+ "Requirement already satisfied: cachetools>=4.0 in /usr/local/lib/python3.7/dist-packages (from streamlit==0.85.1->t5s) (4.2.2)\n",
212
+ "Collecting base58\n",
213
+ " Downloading base58-2.1.0-py3-none-any.whl (5.6 kB)\n",
214
+ "Collecting pydeck>=0.1.dev5\n",
215
+ " Downloading pydeck-0.6.2-py2.py3-none-any.whl (4.2 MB)\n",
216
+ "\u001b[K |████████████████████████████████| 4.2 MB 63.3 MB/s \n",
217
+ "\u001b[?25hCollecting watchdog\n",
218
+ " Downloading watchdog-2.1.3-py3-none-manylinux2014_x86_64.whl (75 kB)\n",
219
+ "\u001b[K |████████████████████████████████| 75 kB 4.7 MB/s \n",
220
+ "\u001b[?25hCollecting blinker\n",
221
+ " Downloading blinker-1.4.tar.gz (111 kB)\n",
222
+ "\u001b[K |████████████████████████████████| 111 kB 73.9 MB/s \n",
223
+ "\u001b[?25hCollecting validators\n",
224
+ " Downloading validators-0.18.2-py3-none-any.whl (19 kB)\n",
225
+ "Requirement already satisfied: tzlocal in /usr/local/lib/python3.7/dist-packages (from streamlit==0.85.1->t5s) (1.5.1)\n",
226
+ "Requirement already satisfied: pillow>=6.2.0 in /usr/local/lib/python3.7/dist-packages (from streamlit==0.85.1->t5s) (7.1.2)\n",
227
+ "Requirement already satisfied: astor in /usr/local/lib/python3.7/dist-packages (from streamlit==0.85.1->t5s) (0.8.1)\n",
228
+ "Requirement already satisfied: tornado>=5.0 in /usr/local/lib/python3.7/dist-packages (from streamlit==0.85.1->t5s) (5.1.1)\n",
229
+ "Collecting sacremoses\n",
230
+ " Downloading sacremoses-0.0.45-py3-none-any.whl (895 kB)\n",
231
+ "\u001b[K |████████████████████████████████| 895 kB 45.6 MB/s \n",
232
+ "\u001b[?25hRequirement already satisfied: filelock in /usr/local/lib/python3.7/dist-packages (from transformers==4.9.0->t5s) (3.0.12)\n",
233
+ "Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.7/dist-packages (from transformers==4.9.0->t5s) (2019.12.20)\n",
234
+ "Collecting tokenizers<0.11,>=0.10.1\n",
235
+ " Downloading tokenizers-0.10.3-cp37-cp37m-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_12_x86_64.manylinux2010_x86_64.whl (3.3 MB)\n",
236
+ "\u001b[K |████████████████████████████████| 3.3 MB 53.9 MB/s \n",
237
+ "\u001b[?25hCollecting huggingface-hub<0.1.0\n",
238
+ " Downloading huggingface_hub-0.0.12-py3-none-any.whl (37 kB)\n",
239
+ "Collecting Mako\n",
240
+ " Downloading Mako-1.1.4-py2.py3-none-any.whl (75 kB)\n",
241
+ "\u001b[K |████████████████████████████████| 75 kB 4.6 MB/s \n",
242
+ "\u001b[?25hCollecting python-editor>=0.3\n",
243
+ " Downloading python_editor-1.0.4-py3-none-any.whl (4.9 kB)\n",
244
+ "Requirement already satisfied: toolz in /usr/local/lib/python3.7/dist-packages (from altair>=3.2.0->streamlit==0.85.1->t5s) (0.11.1)\n",
245
+ "Requirement already satisfied: jsonschema in /usr/local/lib/python3.7/dist-packages (from altair>=3.2.0->streamlit==0.85.1->t5s) (2.6.0)\n",
246
+ "Requirement already satisfied: jinja2 in /usr/local/lib/python3.7/dist-packages (from altair>=3.2.0->streamlit==0.85.1->t5s) (2.11.3)\n",
247
+ "Collecting websocket-client>=0.32.0\n",
248
+ " Downloading websocket_client-1.1.1-py2.py3-none-any.whl (68 kB)\n",
249
+ "\u001b[K |████████████████████████████████| 68 kB 8.9 MB/s \n",
250
+ "\u001b[?25hRequirement already satisfied: certifi in /usr/local/lib/python3.7/dist-packages (from dulwich>=0.20.23->dvc==2.5.4->t5s) (2021.5.30)\n",
251
+ "Requirement already satisfied: urllib3>=1.24.1 in /usr/local/lib/python3.7/dist-packages (from dulwich>=0.20.23->dvc==2.5.4->t5s) (1.24.3)\n",
252
+ "Collecting atpublic\n",
253
+ " Downloading atpublic-2.3.tar.gz (16 kB)\n",
254
+ "Collecting aiohttp\n",
255
+ " Downloading aiohttp-3.7.4.post0-cp37-cp37m-manylinux2014_x86_64.whl (1.3 MB)\n",
256
+ "\u001b[K |████████████████████████████████| 1.3 MB 74.9 MB/s \n",
257
+ "\u001b[?25hCollecting gitdb<5,>=4.0.1\n",
258
+ " Downloading gitdb-4.0.7-py3-none-any.whl (63 kB)\n",
259
+ "\u001b[K |████████████████████████████████| 63 kB 2.5 MB/s \n",
260
+ "\u001b[?25hCollecting smmap<5,>=3.0.1\n",
261
+ " Downloading smmap-4.0.0-py2.py3-none-any.whl (24 kB)\n",
262
+ "Requirement already satisfied: zipp>=0.5 in /usr/local/lib/python3.7/dist-packages (from importlib-metadata->datasets==1.10.2->t5s) (3.5.0)\n",
263
+ "Requirement already satisfied: decorator in /usr/local/lib/python3.7/dist-packages (from jsonpath-ng>=1.5.1->dvc==2.5.4->t5s) (4.4.2)\n",
264
+ "Collecting ipykernel>=5.1.2\n",
265
+ " Downloading ipykernel-6.0.3-py3-none-any.whl (122 kB)\n",
266
+ "\u001b[K |████████████████████████████████| 122 kB 71.2 MB/s \n",
267
+ "\u001b[?25hRequirement already satisfied: ipywidgets>=7.0.0 in /usr/local/lib/python3.7/dist-packages (from pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (7.6.3)\n",
268
+ "Requirement already satisfied: traitlets>=4.3.2 in /usr/local/lib/python3.7/dist-packages (from pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (5.0.5)\n",
269
+ "Requirement already satisfied: debugpy<2.0,>=1.0.0 in /usr/local/lib/python3.7/dist-packages (from ipykernel>=5.1.2->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (1.0.0)\n",
270
+ "Requirement already satisfied: jupyter-client<7.0 in /usr/local/lib/python3.7/dist-packages (from ipykernel>=5.1.2->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (5.3.5)\n",
271
+ "Collecting ipython<8.0,>=7.23.1\n",
272
+ " Downloading ipython-7.26.0-py3-none-any.whl (786 kB)\n",
273
+ "\u001b[K |████████████████████████████████| 786 kB 84.4 MB/s \n",
274
+ "\u001b[?25hRequirement already satisfied: matplotlib-inline<0.2.0,>=0.1.0 in /usr/local/lib/python3.7/dist-packages (from ipykernel>=5.1.2->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (0.1.2)\n",
275
+ "Collecting importlib-metadata\n",
276
+ " Downloading importlib_metadata-3.10.1-py3-none-any.whl (14 kB)\n",
277
+ "Requirement already satisfied: pickleshare in /usr/local/lib/python3.7/dist-packages (from ipython<8.0,>=7.23.1->ipykernel>=5.1.2->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (0.7.5)\n",
278
+ "Requirement already satisfied: pexpect>4.3 in /usr/local/lib/python3.7/dist-packages (from ipython<8.0,>=7.23.1->ipykernel>=5.1.2->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (4.8.0)\n",
279
+ "Collecting prompt-toolkit!=3.0.0,!=3.0.1,<3.1.0,>=2.0.0\n",
280
+ " Downloading prompt_toolkit-3.0.19-py3-none-any.whl (368 kB)\n",
281
+ "\u001b[K |████████████████████████████████| 368 kB 66.7 MB/s \n",
282
+ "\u001b[?25hRequirement already satisfied: jedi>=0.16 in /usr/local/lib/python3.7/dist-packages (from ipython<8.0,>=7.23.1->ipykernel>=5.1.2->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (0.18.0)\n",
283
+ "Requirement already satisfied: backcall in /usr/local/lib/python3.7/dist-packages (from ipython<8.0,>=7.23.1->ipykernel>=5.1.2->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (0.2.0)\n",
284
+ "Requirement already satisfied: pygments in /usr/local/lib/python3.7/dist-packages (from ipython<8.0,>=7.23.1->ipykernel>=5.1.2->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (2.6.1)\n",
285
+ "Requirement already satisfied: nbformat>=4.2.0 in /usr/local/lib/python3.7/dist-packages (from ipywidgets>=7.0.0->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (5.1.3)\n",
286
+ "Requirement already satisfied: widgetsnbextension~=3.5.0 in /usr/local/lib/python3.7/dist-packages (from ipywidgets>=7.0.0->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (3.5.1)\n",
287
+ "Requirement already satisfied: jupyterlab-widgets>=1.0.0 in /usr/local/lib/python3.7/dist-packages (from ipywidgets>=7.0.0->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (1.0.0)\n",
288
+ "Requirement already satisfied: parso<0.9.0,>=0.8.0 in /usr/local/lib/python3.7/dist-packages (from jedi>=0.16->ipython<8.0,>=7.23.1->ipykernel>=5.1.2->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (0.8.2)\n",
289
+ "Requirement already satisfied: MarkupSafe>=0.23 in /usr/local/lib/python3.7/dist-packages (from jinja2->altair>=3.2.0->streamlit==0.85.1->t5s) (2.0.1)\n",
290
+ "Requirement already satisfied: pyzmq>=13 in /usr/local/lib/python3.7/dist-packages (from jupyter-client<7.0->ipykernel>=5.1.2->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (22.1.0)\n",
291
+ "Requirement already satisfied: jupyter-core>=4.6.0 in /usr/local/lib/python3.7/dist-packages (from jupyter-client<7.0->ipykernel>=5.1.2->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (4.7.1)\n",
292
+ "Requirement already satisfied: ipython-genutils in /usr/local/lib/python3.7/dist-packages (from nbformat>=4.2.0->ipywidgets>=7.0.0->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (0.2.0)\n",
293
+ "Requirement already satisfied: ptyprocess>=0.5 in /usr/local/lib/python3.7/dist-packages (from pexpect>4.3->ipython<8.0,>=7.23.1->ipykernel>=5.1.2->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (0.7.0)\n",
294
+ "Requirement already satisfied: wcwidth in /usr/local/lib/python3.7/dist-packages (from prompt-toolkit!=3.0.0,!=3.0.1,<3.1.0,>=2.0.0->ipython<8.0,>=7.23.1->ipykernel>=5.1.2->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (0.2.5)\n",
295
+ "Requirement already satisfied: cached-property in /usr/local/lib/python3.7/dist-packages (from pygit2>=1.5.0->dvc==2.5.4->t5s) (1.5.2)\n",
296
+ "Requirement already satisfied: cffi>=1.4.0 in /usr/local/lib/python3.7/dist-packages (from pygit2>=1.5.0->dvc==2.5.4->t5s) (1.14.6)\n",
297
+ "Requirement already satisfied: pycparser in /usr/local/lib/python3.7/dist-packages (from cffi>=1.4.0->pygit2>=1.5.0->dvc==2.5.4->t5s) (2.20)\n",
298
+ "Collecting ftfy\n",
299
+ " Downloading ftfy-6.0.3.tar.gz (64 kB)\n",
300
+ "\u001b[K |████████████████████████████████| 64 kB 3.7 MB/s \n",
301
+ "\u001b[?25hRequirement already satisfied: python-slugify in /usr/local/lib/python3.7/dist-packages (from python-benedict>=0.21.1->dvc==2.5.4->t5s) (5.0.2)\n",
302
+ "Collecting mailchecker\n",
303
+ " Downloading mailchecker-4.0.11.tar.gz (201 kB)\n",
304
+ "\u001b[K |████████████████████████████████| 201 kB 60.6 MB/s \n",
305
+ "\u001b[?25hCollecting python-fsutil\n",
306
+ " Downloading python_fsutil-0.5.0-py3-none-any.whl (11 kB)\n",
307
+ "Collecting phonenumbers\n",
308
+ " Downloading phonenumbers-8.12.29-py2.py3-none-any.whl (2.6 MB)\n",
309
+ "\u001b[K |████████████████████████████████| 2.6 MB 46.9 MB/s \n",
310
+ "\u001b[?25hCollecting xmltodict\n",
311
+ " Downloading xmltodict-0.12.0-py2.py3-none-any.whl (9.2 kB)\n",
312
+ "Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.7/dist-packages (from requests>=2.19.0->datasets==1.10.2->t5s) (2.10)\n",
313
+ "Requirement already satisfied: chardet<4,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from requests>=2.19.0->datasets==1.10.2->t5s) (3.0.4)\n",
314
+ "Collecting commonmark<0.10.0,>=0.9.0\n",
315
+ " Downloading commonmark-0.9.1-py2.py3-none-any.whl (51 kB)\n",
316
+ "\u001b[K |████████████████████████████████| 51 kB 8.0 MB/s \n",
317
+ "\u001b[?25hCollecting ruamel.yaml.clib>=0.1.2\n",
318
+ " Downloading ruamel.yaml.clib-0.2.6-cp37-cp37m-manylinux1_x86_64.whl (546 kB)\n",
319
+ "\u001b[K |████████████████████████████████| 546 kB 78.5 MB/s \n",
320
+ "\u001b[?25hRequirement already satisfied: greenlet!=0.4.17 in /usr/local/lib/python3.7/dist-packages (from sqlalchemy->mlflow==1.19.0->t5s) (1.1.0)\n",
321
+ "Requirement already satisfied: grpcio>=1.24.3 in /usr/local/lib/python3.7/dist-packages (from tensorboard!=2.5.0,>=2.2.0->pytorch-lightning==1.3.5->t5s) (1.34.1)\n",
322
+ "Requirement already satisfied: markdown>=2.6.8 in /usr/local/lib/python3.7/dist-packages (from tensorboard!=2.5.0,>=2.2.0->pytorch-lightning==1.3.5->t5s) (3.3.4)\n",
323
+ "Requirement already satisfied: werkzeug>=0.11.15 in /usr/local/lib/python3.7/dist-packages (from tensorboard!=2.5.0,>=2.2.0->pytorch-lightning==1.3.5->t5s) (1.0.1)\n",
324
+ "Requirement already satisfied: google-auth-oauthlib<0.5,>=0.4.1 in /usr/local/lib/python3.7/dist-packages (from tensorboard!=2.5.0,>=2.2.0->pytorch-lightning==1.3.5->t5s) (0.4.4)\n",
325
+ "Requirement already satisfied: wheel>=0.26 in /usr/local/lib/python3.7/dist-packages (from tensorboard!=2.5.0,>=2.2.0->pytorch-lightning==1.3.5->t5s) (0.36.2)\n",
326
+ "Requirement already satisfied: tensorboard-plugin-wit>=1.6.0 in /usr/local/lib/python3.7/dist-packages (from tensorboard!=2.5.0,>=2.2.0->pytorch-lightning==1.3.5->t5s) (1.8.0)\n",
327
+ "Requirement already satisfied: tensorboard-data-server<0.7.0,>=0.6.0 in /usr/local/lib/python3.7/dist-packages (from tensorboard!=2.5.0,>=2.2.0->pytorch-lightning==1.3.5->t5s) (0.6.1)\n",
328
+ "Requirement already satisfied: google-auth<2,>=1.6.3 in /usr/local/lib/python3.7/dist-packages (from tensorboard!=2.5.0,>=2.2.0->pytorch-lightning==1.3.5->t5s) (1.32.1)\n",
329
+ "Requirement already satisfied: pyasn1-modules>=0.2.1 in /usr/local/lib/python3.7/dist-packages (from google-auth<2,>=1.6.3->tensorboard!=2.5.0,>=2.2.0->pytorch-lightning==1.3.5->t5s) (0.2.8)\n",
330
+ "Requirement already satisfied: rsa<5,>=3.1.4 in /usr/local/lib/python3.7/dist-packages (from google-auth<2,>=1.6.3->tensorboard!=2.5.0,>=2.2.0->pytorch-lightning==1.3.5->t5s) (4.7.2)\n",
331
+ "Requirement already satisfied: requests-oauthlib>=0.7.0 in /usr/local/lib/python3.7/dist-packages (from google-auth-oauthlib<0.5,>=0.4.1->tensorboard!=2.5.0,>=2.2.0->pytorch-lightning==1.3.5->t5s) (1.3.0)\n",
332
+ "Requirement already satisfied: oauthlib>=3.0.0 in /usr/local/lib/python3.7/dist-packages (from requests-oauthlib>=0.7.0->google-auth-oauthlib<0.5,>=0.4.1->tensorboard!=2.5.0,>=2.2.0->pytorch-lightning==1.3.5->t5s) (3.1.1)\n",
333
+ "Requirement already satisfied: notebook>=4.4.1 in /usr/local/lib/python3.7/dist-packages (from widgetsnbextension~=3.5.0->ipywidgets>=7.0.0->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (5.3.1)\n",
334
+ "Requirement already satisfied: Send2Trash in /usr/local/lib/python3.7/dist-packages (from notebook>=4.4.1->widgetsnbextension~=3.5.0->ipywidgets>=7.0.0->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (1.7.1)\n",
335
+ "Requirement already satisfied: terminado>=0.8.1 in /usr/local/lib/python3.7/dist-packages (from notebook>=4.4.1->widgetsnbextension~=3.5.0->ipywidgets>=7.0.0->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (0.10.1)\n",
336
+ "Requirement already satisfied: nbconvert in /usr/local/lib/python3.7/dist-packages (from notebook>=4.4.1->widgetsnbextension~=3.5.0->ipywidgets>=7.0.0->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (5.6.1)\n",
337
+ "Collecting async-timeout<4.0,>=3.0\n",
338
+ " Downloading async_timeout-3.0.1-py3-none-any.whl (8.2 kB)\n",
339
+ "Collecting yarl<2.0,>=1.0\n",
340
+ " Downloading yarl-1.6.3-cp37-cp37m-manylinux2014_x86_64.whl (294 kB)\n",
341
+ "\u001b[K |████████████████████████████████| 294 kB 64.6 MB/s \n",
342
+ "\u001b[?25hCollecting multidict<7.0,>=4.5\n",
343
+ " Downloading multidict-5.1.0-cp37-cp37m-manylinux2014_x86_64.whl (142 kB)\n",
344
+ "\u001b[K |████████████████████████████████| 142 kB 65.0 MB/s \n",
345
+ "\u001b[?25hCollecting s3transfer<0.6.0,>=0.5.0\n",
346
+ " Downloading s3transfer-0.5.0-py3-none-any.whl (79 kB)\n",
347
+ "\u001b[K |████████████████████████████████| 79 kB 10.8 MB/s \n",
348
+ "\u001b[?25hCollecting docutils<0.16,>=0.10\n",
349
+ " Downloading docutils-0.15.2-py3-none-any.whl (547 kB)\n",
350
+ "\u001b[K |████████████████████████████████| 547 kB 60.9 MB/s \n",
351
+ "\u001b[?25hCollecting botocore==1.21.18\n",
352
+ " Downloading botocore-1.21.18-py3-none-any.whl (7.8 MB)\n",
353
+ "\u001b[K |████████████████████████████████| 7.8 MB 48.9 MB/s \n",
354
+ "\u001b[?25hCollecting colorama>=0.3.9\n",
355
+ " Downloading colorama-0.4.3-py2.py3-none-any.whl (15 kB)\n",
356
+ "Collecting jmespath<1.0.0,>=0.7.1\n",
357
+ " Downloading jmespath-0.10.0-py2.py3-none-any.whl (24 kB)\n",
358
+ "Collecting urllib3>=1.24.1\n",
359
+ " Downloading urllib3-1.25.11-py2.py3-none-any.whl (127 kB)\n",
360
+ "\u001b[K |████████████████████████████████| 127 kB 77.1 MB/s \n",
361
+ "\u001b[?25hCollecting typed-ast>=1.4.2\n",
362
+ " Downloading typed_ast-1.4.3-cp37-cp37m-manylinux1_x86_64.whl (743 kB)\n",
363
+ "\u001b[K |████████████████████████████████| 743 kB 51.4 MB/s \n",
364
+ "\u001b[?25hCollecting mypy-extensions>=0.4.3\n",
365
+ " Downloading mypy_extensions-0.4.3-py2.py3-none-any.whl (4.5 kB)\n",
366
+ "Collecting regex!=2019.12.17\n",
367
+ " Downloading regex-2021.8.3-cp37-cp37m-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (722 kB)\n",
368
+ "\u001b[K |████████████████████████████████| 722 kB 80.3 MB/s \n",
369
+ "\u001b[?25hCollecting tomli<2.0.0,>=0.2.6\n",
370
+ " Downloading tomli-1.2.1-py3-none-any.whl (11 kB)\n",
371
+ "Collecting pycodestyle<2.8.0,>=2.7.0\n",
372
+ " Downloading pycodestyle-2.7.0-py2.py3-none-any.whl (41 kB)\n",
373
+ "\u001b[K |████████████████████████████████| 41 kB 800 kB/s \n",
374
+ "\u001b[?25hCollecting mccabe<0.7.0,>=0.6.0\n",
375
+ " Downloading mccabe-0.6.1-py2.py3-none-any.whl (8.6 kB)\n",
376
+ "Collecting pyflakes<2.4.0,>=2.3.0\n",
377
+ " Downloading pyflakes-2.3.1-py2.py3-none-any.whl (68 kB)\n",
378
+ "\u001b[K |████████████████████████████████| 68 kB 9.2 MB/s \n",
379
+ "\u001b[?25hRequirement already satisfied: itsdangerous<2.0,>=0.24 in /usr/local/lib/python3.7/dist-packages (from Flask->mlflow==1.19.0->t5s) (1.1.0)\n",
380
+ "Requirement already satisfied: mistune<2,>=0.8.1 in /usr/local/lib/python3.7/dist-packages (from nbconvert->notebook>=4.4.1->widgetsnbextension~=3.5.0->ipywidgets>=7.0.0->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (0.8.4)\n",
381
+ "Requirement already satisfied: pandocfilters>=1.4.1 in /usr/local/lib/python3.7/dist-packages (from nbconvert->notebook>=4.4.1->widgetsnbextension~=3.5.0->ipywidgets>=7.0.0->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (1.4.3)\n",
382
+ "Requirement already satisfied: bleach in /usr/local/lib/python3.7/dist-packages (from nbconvert->notebook>=4.4.1->widgetsnbextension~=3.5.0->ipywidgets>=7.0.0->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (3.3.0)\n",
383
+ "Requirement already satisfied: testpath in /usr/local/lib/python3.7/dist-packages (from nbconvert->notebook>=4.4.1->widgetsnbextension~=3.5.0->ipywidgets>=7.0.0->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (0.5.0)\n",
384
+ "Requirement already satisfied: defusedxml in /usr/local/lib/python3.7/dist-packages (from nbconvert->notebook>=4.4.1->widgetsnbextension~=3.5.0->ipywidgets>=7.0.0->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (0.7.1)\n",
385
+ "Requirement already satisfied: webencodings in /usr/local/lib/python3.7/dist-packages (from bleach->nbconvert->notebook>=4.4.1->widgetsnbextension~=3.5.0->ipywidgets>=7.0.0->pydeck>=0.1.dev5->streamlit==0.85.1->t5s) (0.5.1)\n",
386
+ "Requirement already satisfied: prometheus_client in /usr/local/lib/python3.7/dist-packages (from prometheus-flask-exporter->mlflow==1.19.0->t5s) (0.11.0)\n",
387
+ "Requirement already satisfied: text-unidecode>=1.3 in /usr/local/lib/python3.7/dist-packages (from python-slugify->python-benedict>=0.21.1->dvc==2.5.4->t5s) (1.3)\n",
388
+ "Requirement already satisfied: joblib in /usr/local/lib/python3.7/dist-packages (from sacremoses->transformers==4.9.0->t5s) (1.0.1)\n",
389
+ "Building wheels for collected packages: alembic, configobj, databricks-cli, dpath, flufl.lock, future, nanotime, pygtrie, atpublic, blinker, ftfy, mailchecker, prometheus-flask-exporter\n",
390
+ " Building wheel for alembic (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
391
+ " Created wheel for alembic: filename=alembic-1.4.1-py2.py3-none-any.whl size=158170 sha256=20ad21344dd1659d217c9af67cff17c335d06beb84b39d602951659a0b537f83\n",
392
+ " Stored in directory: /root/.cache/pip/wheels/be/5d/0a/9e13f53f4f5dfb67cd8d245bb7cdffe12f135846f491a283e3\n",
393
+ " Building wheel for configobj (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
394
+ " Created wheel for configobj: filename=configobj-5.0.6-py3-none-any.whl size=34547 sha256=fba9d1f14dc2e9360484cefb3742f8ccabba9ff57bd1aa25d34c06d6f56f1ce4\n",
395
+ " Stored in directory: /root/.cache/pip/wheels/0d/c4/19/13d74440f2a571841db6b6e0a273694327498884dafb9cf978\n",
396
+ " Building wheel for databricks-cli (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
397
+ " Created wheel for databricks-cli: filename=databricks_cli-0.15.0-py3-none-any.whl size=105259 sha256=f26ac8fd22b7d26afc1f2a651bc303248bb4b3288f26424079d090f0bc8dbad3\n",
398
+ " Stored in directory: /root/.cache/pip/wheels/e7/ba/75/284f9a90ff7a010bb23b9798f2e9a19dd9fe619379c917bff4\n",
399
+ " Building wheel for dpath (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
400
+ " Created wheel for dpath: filename=dpath-2.0.1-py3-none-any.whl size=15153 sha256=6c0c0fd902c652f5e2f8bcc660c925d6563bfe31a034fe28fbce1f3673c53047\n",
401
+ " Stored in directory: /root/.cache/pip/wheels/bc/f8/ae/bc69cb5f61393ebf9ade4cde41d1a813d35bfe78263a26f99e\n",
402
+ " Building wheel for flufl.lock (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
403
+ " Created wheel for flufl.lock: filename=flufl.lock-3.2-py3-none-any.whl size=19927 sha256=12059ea8c31a7c3012fa9fac08321da0dd2e161993875d5349098bdf10f21321\n",
404
+ " Stored in directory: /root/.cache/pip/wheels/49/68/a0/8e7cb7bbf4990fc10b5a082aa0eb3ac66787ca11e8eca445b2\n",
405
+ " Building wheel for future (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
406
+ " Created wheel for future: filename=future-0.18.2-py3-none-any.whl size=491070 sha256=3065296c65b1cd133bd427cb975a4598ac22080f752dc05191f2cac7589d5f21\n",
407
+ " Stored in directory: /root/.cache/pip/wheels/56/b0/fe/4410d17b32f1f0c3cf54cdfb2bc04d7b4b8f4ae377e2229ba0\n",
408
+ " Building wheel for nanotime (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
409
+ " Created wheel for nanotime: filename=nanotime-0.5.2-py3-none-any.whl size=2440 sha256=fd0ec6cd1d5a377a38b2d8420249ee5a2a40d3c3ac9027a63df96eccb65d33a9\n",
410
+ " Stored in directory: /root/.cache/pip/wheels/b8/92/aa/456d462c908b4e210c3928f778d28f94049fc9e47af8b191c9\n",
411
+ " Building wheel for pygtrie (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
412
+ " Created wheel for pygtrie: filename=pygtrie-2.4.2-py3-none-any.whl size=19061 sha256=1f0abccd08f95a448d171de8251128d943c397f23889049a377f1259757b5f4f\n",
413
+ " Stored in directory: /root/.cache/pip/wheels/d3/f8/ba/1d828b1603ea422686eb694253a43cb3a5901ea4696c1e0603\n",
414
+ " Building wheel for atpublic (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
415
+ " Created wheel for atpublic: filename=atpublic-2.3-py3-none-any.whl size=5032 sha256=7da4354afc862c36dee40560733e41cad62646a6b3361fbe79d8722ae56620ce\n",
416
+ " Stored in directory: /root/.cache/pip/wheels/46/d9/0f/54be2ecb4bcb1612f987f0b6482d88fa7f3e43d3946f36a32a\n",
417
+ " Building wheel for blinker (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
418
+ " Created wheel for blinker: filename=blinker-1.4-py3-none-any.whl size=13479 sha256=f6807d6fec7557bd3b537d3dc4ac317ff9e119f8548cf6c9b832761a664106c0\n",
419
+ " Stored in directory: /root/.cache/pip/wheels/22/f5/18/df711b66eb25b21325c132757d4314db9ac5e8dabeaf196eab\n",
420
+ " Building wheel for ftfy (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
421
+ " Created wheel for ftfy: filename=ftfy-6.0.3-py3-none-any.whl size=41934 sha256=140f2cf4ce8ed83edf9537a463a9b230bbf147b4ab5bc269e95f146e6ec59d2e\n",
422
+ " Stored in directory: /root/.cache/pip/wheels/19/f5/38/273eb3b5e76dfd850619312f693716ac4518b498f5ffb6f56d\n",
423
+ " Building wheel for mailchecker (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
424
+ " Created wheel for mailchecker: filename=mailchecker-4.0.11-py3-none-any.whl size=201671 sha256=b50a4a12a341a53472ddc32efd54228a6741dc41a2ccfb865737841e0382c0c1\n",
425
+ " Stored in directory: /root/.cache/pip/wheels/0b/cd/39/230bf7caff55afc08eb4a1d433731706d76fde0b95d70df3ca\n",
426
+ " Building wheel for prometheus-flask-exporter (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
427
+ " Created wheel for prometheus-flask-exporter: filename=prometheus_flask_exporter-0.18.2-py3-none-any.whl size=17416 sha256=9e08ca8dfee8cbea10b2e4d0ccc948d085aeda03278bd2ad97239a28092ce8e6\n",
428
+ " Stored in directory: /root/.cache/pip/wheels/6a/1e/1c/c765920cb92b2f0343d2dd8b481a407cee2823f9b4bbd2e52a\n",
429
+ "Successfully built alembic configobj databricks-cli dpath flufl.lock future nanotime pygtrie atpublic blinker ftfy mailchecker prometheus-flask-exporter\n",
430
+ "Installing collected packages: prompt-toolkit, ipython, importlib-metadata, urllib3, ipykernel, multidict, yarl, smmap, numpy, jmespath, async-timeout, xmltodict, websocket-client, tqdm, ruamel.yaml.clib, regex, pyyaml, python-fsutil, python-editor, ply, phonenumbers, Mako, mailchecker, gitdb, future, ftfy, fsspec, commonmark, colorama, botocore, atpublic, aiohttp, zc.lockfile, xxhash, watchdog, voluptuous, validators, typed-ast, torchmetrics, tomli, tokenizers, tensorboard, shtab, shortuuid, sacremoses, s3transfer, ruamel.yaml, rich, querystring-parser, python-benedict, pygtrie, pygit2, pyflakes, pyDeprecate, pydeck, pycodestyle, psutil, prometheus-flask-exporter, pathspec, nanotime, mypy-extensions, mccabe, jsonpath-ng, huggingface-hub, gunicorn, grandalf, gitpython, funcy, flufl.lock, flatten-dict, dulwich, dpath, docutils, docker, distro, diskcache, dictdiffer, databricks-cli, configobj, blinker, base58, alembic, transformers, streamlit, rouge-score, pytorch-lightning, python-dotenv, mlflow, flake8, dvc, datasets, dagshub, black, awscli, t5s\n",
431
+ " Attempting uninstall: prompt-toolkit\n",
432
+ " Found existing installation: prompt-toolkit 1.0.18\n",
433
+ " Uninstalling prompt-toolkit-1.0.18:\n",
434
+ " Successfully uninstalled prompt-toolkit-1.0.18\n",
435
+ " Attempting uninstall: ipython\n",
436
+ " Found existing installation: ipython 5.5.0\n",
437
+ " Uninstalling ipython-5.5.0:\n",
438
+ " Successfully uninstalled ipython-5.5.0\n",
439
+ " Attempting uninstall: importlib-metadata\n",
440
+ " Found existing installation: importlib-metadata 4.6.1\n",
441
+ " Uninstalling importlib-metadata-4.6.1:\n",
442
+ " Successfully uninstalled importlib-metadata-4.6.1\n",
443
+ " Attempting uninstall: urllib3\n",
444
+ " Found existing installation: urllib3 1.24.3\n",
445
+ " Uninstalling urllib3-1.24.3:\n",
446
+ " Successfully uninstalled urllib3-1.24.3\n",
447
+ " Attempting uninstall: ipykernel\n",
448
+ " Found existing installation: ipykernel 4.10.1\n",
449
+ " Uninstalling ipykernel-4.10.1:\n",
450
+ " Successfully uninstalled ipykernel-4.10.1\n",
451
+ " Attempting uninstall: numpy\n",
452
+ " Found existing installation: numpy 1.19.5\n",
453
+ " Uninstalling numpy-1.19.5:\n",
454
+ " Successfully uninstalled numpy-1.19.5\n",
455
+ " Attempting uninstall: tqdm\n",
456
+ " Found existing installation: tqdm 4.41.1\n",
457
+ " Uninstalling tqdm-4.41.1:\n",
458
+ " Successfully uninstalled tqdm-4.41.1\n",
459
+ " Attempting uninstall: regex\n",
460
+ " Found existing installation: regex 2019.12.20\n",
461
+ " Uninstalling regex-2019.12.20:\n",
462
+ " Successfully uninstalled regex-2019.12.20\n",
463
+ " Attempting uninstall: pyyaml\n",
464
+ " Found existing installation: PyYAML 3.13\n",
465
+ " Uninstalling PyYAML-3.13:\n",
466
+ " Successfully uninstalled PyYAML-3.13\n",
467
+ " Attempting uninstall: future\n",
468
+ " Found existing installation: future 0.16.0\n",
469
+ " Uninstalling future-0.16.0:\n",
470
+ " Successfully uninstalled future-0.16.0\n",
471
+ " Attempting uninstall: tensorboard\n",
472
+ " Found existing installation: tensorboard 2.5.0\n",
473
+ " Uninstalling tensorboard-2.5.0:\n",
474
+ " Successfully uninstalled tensorboard-2.5.0\n",
475
+ " Attempting uninstall: psutil\n",
476
+ " Found existing installation: psutil 5.4.8\n",
477
+ " Uninstalling psutil-5.4.8:\n",
478
+ " Successfully uninstalled psutil-5.4.8\n",
479
+ " Attempting uninstall: docutils\n",
480
+ " Found existing installation: docutils 0.17.1\n",
481
+ " Uninstalling docutils-0.17.1:\n",
482
+ " Successfully uninstalled docutils-0.17.1\n",
483
+ "\u001b[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.\n",
484
+ "jupyter-console 5.2.0 requires prompt-toolkit<2.0.0,>=1.0.0, but you have prompt-toolkit 3.0.19 which is incompatible.\n",
485
+ "google-colab 1.0.0 requires ipykernel~=4.10, but you have ipykernel 6.0.3 which is incompatible.\n",
486
+ "google-colab 1.0.0 requires ipython~=5.5.0, but you have ipython 7.26.0 which is incompatible.\n",
487
+ "datascience 0.10.6 requires folium==0.2.1, but you have folium 0.8.3 which is incompatible.\n",
488
+ "albumentations 0.1.12 requires imgaug<0.2.7,>=0.2.5, but you have imgaug 0.2.9 which is incompatible.\u001b[0m\n",
489
+ "Successfully installed Mako-1.1.4 aiohttp-3.7.4.post0 alembic-1.4.1 async-timeout-3.0.1 atpublic-2.3 awscli-1.20.18 base58-2.1.0 black-21.7b0 blinker-1.4 botocore-1.21.18 colorama-0.4.3 commonmark-0.9.1 configobj-5.0.6 dagshub-0.1.7 databricks-cli-0.15.0 datasets-1.10.2 dictdiffer-0.9.0 diskcache-5.2.1 distro-1.6.0 docker-5.0.0 docutils-0.15.2 dpath-2.0.1 dulwich-0.20.24 dvc-2.5.4 flake8-3.9.2 flatten-dict-0.4.2 flufl.lock-3.2 fsspec-2021.7.0 ftfy-6.0.3 funcy-1.16 future-0.18.2 gitdb-4.0.7 gitpython-3.1.18 grandalf-0.6 gunicorn-20.1.0 huggingface-hub-0.0.12 importlib-metadata-3.10.1 ipykernel-6.0.3 ipython-7.26.0 jmespath-0.10.0 jsonpath-ng-1.5.3 mailchecker-4.0.11 mccabe-0.6.1 mlflow-1.19.0 multidict-5.1.0 mypy-extensions-0.4.3 nanotime-0.5.2 numpy-1.19.2 pathspec-0.9.0 phonenumbers-8.12.29 ply-3.11 prometheus-flask-exporter-0.18.2 prompt-toolkit-3.0.19 psutil-5.8.0 pyDeprecate-0.3.0 pycodestyle-2.7.0 pydeck-0.6.2 pyflakes-2.3.1 pygit2-1.6.1 pygtrie-2.4.2 python-benedict-0.24.1 python-dotenv-0.19.0 python-editor-1.0.4 python-fsutil-0.5.0 pytorch-lightning-1.3.5 pyyaml-5.4.1 querystring-parser-1.2.4 regex-2021.8.3 rich-10.7.0 rouge-score-0.0.4 ruamel.yaml-0.17.10 ruamel.yaml.clib-0.2.6 s3transfer-0.5.0 sacremoses-0.0.45 shortuuid-1.0.1 shtab-1.3.10 smmap-4.0.0 streamlit-0.85.1 t5s-1.0.4 tensorboard-2.6.0 tokenizers-0.10.3 tomli-1.2.1 torchmetrics-0.5.0 tqdm-4.62.0 transformers-4.9.0 typed-ast-1.4.3 urllib3-1.25.11 validators-0.18.2 voluptuous-0.12.1 watchdog-2.1.3 websocket-client-1.1.1 xmltodict-0.12.0 xxhash-2.0.2 yarl-1.6.3 zc.lockfile-2.0\n"
490
+ ],
491
+ "name": "stdout"
492
+ },
493
+ {
494
+ "output_type": "display_data",
495
+ "data": {
496
+ "application/vnd.colab-display-data+json": {
497
+ "pip_warning": {
498
+ "packages": [
499
+ "IPython",
500
+ "ipykernel",
501
+ "numpy",
502
+ "prompt_toolkit",
503
+ "psutil"
504
+ ]
505
+ }
506
+ }
507
+ },
508
+ "metadata": {
509
+ "tags": []
510
+ }
511
+ }
512
+ ]
513
+ },
514
+ {
515
+ "cell_type": "code",
516
+ "metadata": {
517
+ "colab": {
518
+ "base_uri": "https://localhost:8080/"
519
+ },
520
+ "id": "5Fe-bL2RrmMf",
521
+ "outputId": "d33d3c82-5633-4abe-d2b4-8e4d9da0d4e7"
522
+ },
523
+ "source": [
524
+ "!t5s clone"
525
+ ],
526
+ "execution_count": 2,
527
+ "outputs": [
528
+ {
529
+ "output_type": "stream",
530
+ "text": [
531
+ "arguments passed: clone\n",
532
+ "Cloning into 'summarization'...\n",
533
+ "remote: Enumerating objects: 958, done.\u001b[K\n",
534
+ "remote: Counting objects: 100% (958/958), done.\u001b[K\n",
535
+ "remote: Compressing objects: 100% (876/876), done.\u001b[K\n",
536
+ "remote: Total 958 (delta 552), reused 109 (delta 63)\u001b[K\n",
537
+ "Receiving objects: 100% (958/958), 129.99 KiB | 978.00 KiB/s, done.\n",
538
+ "Resolving deltas: 100% (552/552), done.\n",
539
+ "/content/summarization\n"
540
+ ],
541
+ "name": "stdout"
542
+ }
543
+ ]
544
+ },
545
+ {
546
+ "cell_type": "code",
547
+ "metadata": {
548
+ "colab": {
549
+ "base_uri": "https://localhost:8080/"
550
+ },
551
+ "id": "xIhaMYwhyEuv",
552
+ "outputId": "1ef86679-35eb-43ba-b545-df9bf9a9e4bb"
553
+ },
554
+ "source": [
555
+ "!t5s dirs"
556
+ ],
557
+ "execution_count": 4,
558
+ "outputs": [
559
+ {
560
+ "output_type": "stream",
561
+ "text": [
562
+ "arguments passed: dirs\n",
563
+ "/content/summarization\n",
564
+ "mkdir -p data/raw data/processed models\n"
565
+ ],
566
+ "name": "stdout"
567
+ }
568
+ ]
569
+ },
570
+ {
571
+ "cell_type": "code",
572
+ "metadata": {
573
+ "colab": {
574
+ "base_uri": "https://localhost:8080/"
575
+ },
576
+ "id": "hZqB-NlGzTC-",
577
+ "outputId": "3de5740c-2b4b-4119-ed9f-35da00236cce"
578
+ },
579
+ "source": [
580
+ "!t5s run"
581
+ ],
582
+ "execution_count": 5,
583
+ "outputs": [
584
+ {
585
+ "output_type": "stream",
586
+ "text": [
587
+ "arguments passed: run\n",
588
+ "/content/summarization\n",
589
+ "dvc repro eval\n",
590
+ "Running stage 'download_data':\n",
591
+ "> python src/data/make_dataset.py\n",
592
+ "{'data': 'cnn_dailymail', 'split': 0.001}\n",
593
+ "Downloading: 9.35kB [00:00, 8.50MB/s] \n",
594
+ "Downloading: 9.50kB [00:00, 8.98MB/s] \n",
595
+ "Downloading and preparing dataset cnn_dailymail/3.0.0 (download: 558.32 MiB, generated: 1.28 GiB, post-processed: Unknown size, total: 1.82 GiB) to /root/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/3cb851bf7cf5826e45d49db2863f627cba583cbc32342df7349dfe6c38060234...\n",
596
+ "Downloading: 159MB [00:05, 29.9MB/s]\n",
597
+ "Downloading: 376MB [00:12, 30.6MB/s]\n",
598
+ "Downloading: 2.11MB [00:00, 54.2MB/s] \n",
599
+ "Downloading: 46.4MB [00:00, 72.6MB/s]\n",
600
+ "Downloading: 2.43MB [00:00, 60.6MB/s] \n",
601
+ "Dataset cnn_dailymail downloaded and prepared to /root/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/3cb851bf7cf5826e45d49db2863f627cba583cbc32342df7349dfe6c38060234. Subsequent calls will reuse this data.\n",
602
+ "Reusing dataset cnn_dailymail (/root/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/3cb851bf7cf5826e45d49db2863f627cba583cbc32342df7349dfe6c38060234)\n",
603
+ "Reusing dataset cnn_dailymail (/root/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/3cb851bf7cf5826e45d49db2863f627cba583cbc32342df7349dfe6c38060234)\n",
604
+ "Computing md5 for a large file 'data/raw/train.csv'. This is only done once.\n",
605
+ "Computing file/dir hashes (only done once) |1.00 [00:00, 7.98md5/s]\n",
606
+ "data/raw/train.csv: 0% 0.00/1.17G [00:00<?, ?B/s]\u001b[A\n",
607
+ "data/raw/train.csv: 0% 0.00/1.17G [00:00<?, ?B/s{'info': ''}]\u001b[A\n",
608
+ "data/raw/train.csv: 3% 39.0M/1.17G [00:00<00:03, 402MB/s{'info': ''}]\u001b[A\n",
609
+ "data/raw/train.csv: 6% 75.0M/1.17G [00:00<00:03, 386MB/s{'info': ''}]\u001b[A\n",
610
+ "data/raw/train.csv: 10% 115M/1.17G [00:00<00:02, 399MB/s{'info': ''}] \u001b[A\n",
611
+ "data/raw/train.csv: 13% 154M/1.17G [00:00<00:02, 401MB/s{'info': ''}]\u001b[A\n",
612
+ "data/raw/train.csv: 16% 193M/1.17G [00:00<00:02, 403MB/s{'info': ''}]\u001b[A\n",
613
+ "data/raw/train.csv: 20% 233M/1.17G [00:00<00:02, 407MB/s{'info': ''}]\u001b[A\n",
614
+ "data/raw/train.csv: 23% 273M/1.17G [00:00<00:02, 411MB/s{'info': ''}]\u001b[A\n",
615
+ "data/raw/train.csv: 26% 312M/1.17G [00:00<00:02, 408MB/s{'info': ''}]\u001b[A\n",
616
+ "data/raw/train.csv: 29% 350M/1.17G [00:00<00:02, 405MB/s{'info': ''}]\u001b[A\n",
617
+ "data/raw/train.csv: 33% 389M/1.17G [00:01<00:02, 403MB/s{'info': ''}]\u001b[A\n",
618
+ "data/raw/train.csv: 36% 429M/1.17G [00:01<00:01, 407MB/s{'info': ''}]\u001b[A\n",
619
+ "data/raw/train.csv: 39% 469M/1.17G [00:01<00:01, 409MB/s{'info': ''}]\u001b[A\n",
620
+ "data/raw/train.csv: 43% 509M/1.17G [00:01<00:01, 410MB/s{'info': ''}]\u001b[A\n",
621
+ "data/raw/train.csv: 46% 549M/1.17G [00:01<00:01, 411MB/s{'info': ''}]\u001b[A\n",
622
+ "data/raw/train.csv: 49% 589M/1.17G [00:01<00:01, 411MB/s{'info': ''}]\u001b[A\n",
623
+ "data/raw/train.csv: 53% 628M/1.17G [00:01<00:01, 410MB/s{'info': ''}]\u001b[A\n",
624
+ "data/raw/train.csv: 56% 668M/1.17G [00:01<00:01, 411MB/s{'info': ''}]\u001b[A\n",
625
+ "data/raw/train.csv: 59% 709M/1.17G [00:01<00:01, 414MB/s{'info': ''}]\u001b[A\n",
626
+ "data/raw/train.csv: 63% 750M/1.17G [00:01<00:01, 417MB/s{'info': ''}]\u001b[A\n",
627
+ "data/raw/train.csv: 66% 790M/1.17G [00:02<00:01, 417MB/s{'info': ''}]\u001b[A\n",
628
+ "data/raw/train.csv: 70% 830M/1.17G [00:02<00:00, 417MB/s{'info': ''}]\u001b[A\n",
629
+ "data/raw/train.csv: 73% 871M/1.17G [00:02<00:00, 420MB/s{'info': ''}]\u001b[A\n",
630
+ "data/raw/train.csv: 76% 912M/1.17G [00:02<00:00, 420MB/s{'info': ''}]\u001b[A\n",
631
+ "data/raw/train.csv: 80% 952M/1.17G [00:02<00:00, 418MB/s{'info': ''}]\u001b[A\n",
632
+ "data/raw/train.csv: 83% 992M/1.17G [00:02<00:00, 417MB/s{'info': ''}]\u001b[A\n",
633
+ "data/raw/train.csv: 86% 1.01G/1.17G [00:02<00:00, 412MB/s{'info': ''}]\u001b[A\n",
634
+ "data/raw/train.csv: 90% 1.05G/1.17G [00:02<00:00, 412MB/s{'info': ''}]\u001b[A\n",
635
+ "data/raw/train.csv: 93% 1.08G/1.17G [00:02<00:00, 414MB/s{'info': ''}]\u001b[A\n",
636
+ "data/raw/train.csv: 96% 1.12G/1.17G [00:02<00:00, 413MB/s{'info': ''}]\u001b[A\n",
637
+ "data/raw/train.csv: 100% 1.16G/1.17G [00:03<00:00, 415MB/s{'info': ''}]\u001b[A\n",
638
+ "\n",
639
+ "Running stage 'process_data':\n",
640
+ "> python src/data/process_data.py\n",
641
+ "tcmalloc: large alloc 1073741824 bytes == 0x55d3719fa000 @ 0x7fb648ace2a4 0x7fb636a549f5 0x7fb636a55d42 0x7fb636a5745e 0x7fb636a29068 0x7fb636a28510 0x7fb636a23f4e 0x7fb636a08fe4 0x55d32f1ce010 0x55d32f2bfc0d 0x55d32f2420d8 0x55d32f23d235 0x55d32f1cf73a 0x55d32f23dd67 0x55d32f23cc35 0x55d32f1cf73a 0x55d32f23dd67 0x55d32f1cf65a 0x55d32f23db0e 0x55d32f23cc35 0x55d32f1cf73a 0x55d32f241f40 0x55d32f23cc35 0x55d32f1cf73a 0x55d32f23e93b 0x55d32f23cc35 0x55d32f23c933 0x55d32f306402 0x55d32f30677d 0x55d32f306626 0x55d32f2de313\n",
642
+ "tcmalloc: large alloc 2147483648 bytes == 0x55d3b19fa000 @ 0x7fb648ace2a4 0x7fb636a549f5 0x7fb636a55d42 0x7fb636a5745e 0x7fb636a29068 0x7fb636a28510 0x7fb636a23f4e 0x7fb636a08fe4 0x55d32f1ce010 0x55d32f2bfc0d 0x55d32f2420d8 0x55d32f23d235 0x55d32f1cf73a 0x55d32f23dd67 0x55d32f23cc35 0x55d32f1cf73a 0x55d32f23dd67 0x55d32f1cf65a 0x55d32f23db0e 0x55d32f23cc35 0x55d32f1cf73a 0x55d32f241f40 0x55d32f23cc35 0x55d32f1cf73a 0x55d32f23e93b 0x55d32f23cc35 0x55d32f23c933 0x55d32f306402 0x55d32f30677d 0x55d32f306626 0x55d32f2de313\n",
643
+ "Updating lock file 'dvc.lock'\n",
644
+ "\n",
645
+ "Running stage 'train':\n",
646
+ "> python src/models/train_model.py\n",
647
+ "2021-08-11 01:27:12.108655: I tensorflow/stream_executor/platform/default/dso_loader.cc:53] Successfully opened dynamic library libcudart.so.11.0\n",
648
+ "Global seed set to 42\n",
649
+ "Downloading: 100% 792k/792k [00:00<00:00, 3.83MB/s]\n",
650
+ "Downloading: 100% 1.39M/1.39M [00:00<00:00, 5.04MB/s]\n",
651
+ "Downloading: 100% 1.20k/1.20k [00:00<00:00, 977kB/s]\n",
652
+ "Downloading: 100% 242M/242M [00:07<00:00, 31.2MB/s]\n",
653
+ "GPU available: False, used: False\n",
654
+ "TPU available: False, using: 0 TPU cores\n",
655
+ "\n",
656
+ " | Name | Type | Params\n",
657
+ "-----------------------------------------------------\n",
658
+ "0 | model | T5ForConditionalGeneration | 60.5 M\n",
659
+ "-----------------------------------------------------\n",
660
+ "60.5 M Trainable params\n",
661
+ "0 Non-trainable params\n",
662
+ "60.5 M Total params\n",
663
+ "242.026 Total estimated model params size (MB)\n",
664
+ "Global seed set to 42\n",
665
+ "Epoch 0: 100% 2/2 [00:04<00:00, 2.39s/it]\n",
666
+ "Validating: 0it [00:00, ?it/s]\u001b[A\n",
667
+ "Validating: 0% 0/1 [00:00<?, ?it/s]\u001b[A\n",
668
+ "Epoch 0: 100% 2/2 [00:06<00:00, 3.09s/it, loss=3.06, val_loss=2.620, train_loss=3.060]\n",
669
+ "Epoch 1: 100% 2/2 [00:05<00:00, 2.56s/it, loss=3.06, val_loss=2.620, train_loss=3.060]\n",
670
+ "Validating: 0it [00:00, ?it/s]\u001b[A\n",
671
+ "Validating: 0% 0/1 [00:00<?, ?it/s]\u001b[A\n",
672
+ "Epoch 1: 100% 2/2 [00:06<00:00, 3.31s/it, loss=3.08, val_loss=2.610, train_loss=3.110]\n",
673
+ "Epoch 2: 100% 2/2 [00:05<00:00, 2.72s/it, loss=3.08, val_loss=2.610, train_loss=3.110]\n",
674
+ "Validating: 0it [00:00, ?it/s]\u001b[A\n",
675
+ "Validating: 0% 0/1 [00:00<?, ?it/s]\u001b[A\n",
676
+ "Epoch 2: 100% 2/2 [00:06<00:00, 3.43s/it, loss=3.15, val_loss=2.610, train_loss=3.290]\n",
677
+ "Epoch 3: 100% 2/2 [00:05<00:00, 2.64s/it, loss=3.15, val_loss=2.610, train_loss=3.290]\n",
678
+ "Validating: 0it [00:00, ?it/s]\u001b[A\n",
679
+ "Validating: 0% 0/1 [00:00<?, ?it/s]\u001b[A\n",
680
+ "Epoch 3: 100% 2/2 [00:06<00:00, 3.40s/it, loss=3.07, val_loss=2.610, train_loss=2.830]\n",
681
+ "Epoch 4: 100% 2/2 [00:05<00:00, 2.72s/it, loss=3.07, val_loss=2.610, train_loss=2.830]\n",
682
+ "Validating: 0it [00:00, ?it/s]\u001b[A\n",
683
+ "Validating: 0% 0/1 [00:00<?, ?it/s]\u001b[A\n",
684
+ "Epoch 4: 100% 2/2 [00:06<00:00, 3.49s/it, loss=3.06, val_loss=2.610, train_loss=3.000]\n",
685
+ "Epoch 4: 100% 2/2 [00:19<00:00, 9.72s/it, loss=3.06, val_loss=2.610, train_loss=3.000]\n",
686
+ "Updating lock file 'dvc.lock'\n",
687
+ "\n",
688
+ "Running stage 'eval':\n",
689
+ "> python src/models/evaluate_model.py\n",
690
+ "2021-08-11 01:28:58.833599: I tensorflow/stream_executor/platform/default/dso_loader.cc:53] Successfully opened dynamic library libcudart.so.11.0\n",
691
+ "Global seed set to 42\n",
692
+ "Downloading: 5.61kB [00:00, 6.51MB/s] \n",
693
+ " 0% 0/11 [00:00<?, ?it/s]/usr/local/lib/python3.7/dist-packages/torch/_tensor.py:575: UserWarning: floor_divide is deprecated, and will be removed in a future version of pytorch. It currently rounds toward 0 (like the 'trunc' function NOT 'floor'). This results in incorrect rounding for negative values.\n",
694
+ "To keep the current behavior, use torch.div(a, b, rounding_mode='trunc'), or for actual floor division, use torch.div(a, b, rounding_mode='floor'). (Triggered internally at /pytorch/aten/src/ATen/native/BinaryOps.cpp:467.)\n",
695
+ " return torch.floor_divide(self, other)\n",
696
+ " 9% 1/11 [00:02<00:23, 2.35s/it]Token indices sequence length is longer than the specified maximum sequence length for this model (646 > 512). Running this sequence through the model will result in indexing errors\n",
697
+ "100% 11/11 [00:42<00:00, 3.85s/it]\n",
698
+ "Updating lock file 'dvc.lock'\n",
699
+ "\n",
700
+ "To track the changes with git, run:\n",
701
+ "\n",
702
+ "\tgit add dvc.lock\n",
703
+ "Use `dvc push` to send your updates to remote storage.\n",
704
+ "\u001b[0m"
705
+ ],
706
+ "name": "stdout"
707
+ }
708
+ ]
709
+ },
710
+ {
711
+ "cell_type": "code",
712
+ "metadata": {
713
+ "colab": {
714
+ "base_uri": "https://localhost:8080/"
715
+ },
716
+ "id": "GrjzOTbnzlf_",
717
+ "outputId": "eb72bf20-9f6b-4f53-d4be-c8e328f3fe26"
718
+ },
719
+ "source": [
720
+ "!t5s push"
721
+ ],
722
+ "execution_count": 6,
723
+ "outputs": [
724
+ {
725
+ "output_type": "stream",
726
+ "text": [
727
+ "arguments passed: push\n",
728
+ "/content/summarization\n",
729
+ "dvc push -r origin\n",
730
+ "Uploading: 0% 0/2 [00:00<?, ?file/s{'info': ''}]\n",
731
+ "models/pytorch_model.bin: 0% 0.00/242M [00:00<?, ?it/s]\u001b[A\n",
732
+ "models/pytorch_model.bin: 0% 0.00/242M [00:00<?, ?it/s{'info': ''}]\u001b[A\n",
733
+ "\u001b[31mERROR\u001b[39m: failed to upload '.dvc/cache/5c/e55591940b3086e8e741ce48ef09c3' to 'https://dagshub.com/gagan3012/summarization.dvc/5c/e55591940b3086e8e741ce48ef09c3' - could not perform a POST request\n",
734
+ "\u001b[31mERROR\u001b[39m: failed to upload '.dvc/cache/5f/d59e3c3675d3f3fce7716206d3166d.dir' to 'https://dagshub.com/gagan3012/summarization.dvc/5f/d59e3c3675d3f3fce7716206d3166d.dir'\n",
735
+ "\u001b[31mERROR\u001b[39m: failed to push data to the cloud - 2 files failed to upload\n",
736
+ "\u001b[0mMakefile:42: recipe for target 'push' failed\n",
737
+ "make: *** [push] Error 1\n"
738
+ ],
739
+ "name": "stdout"
740
+ }
741
+ ]
742
+ },
743
+ {
744
+ "cell_type": "code",
745
+ "metadata": {
746
+ "colab": {
747
+ "base_uri": "https://localhost:8080/"
748
+ },
749
+ "id": "AdNmmv9C1Uvg",
750
+ "outputId": "0c7080ef-aafe-4cfa-f95a-539e674b2ce1"
751
+ },
752
+ "source": [
753
+ "!sudo apt-get install git-lfs \n",
754
+ "!t5s push_to_hf_hub"
755
+ ],
756
+ "execution_count": 9,
757
+ "outputs": [
758
+ {
759
+ "output_type": "stream",
760
+ "text": [
761
+ "Reading package lists... Done\n",
762
+ "Building dependency tree \n",
763
+ "Reading state information... Done\n",
764
+ "The following NEW packages will be installed:\n",
765
+ " git-lfs\n",
766
+ "0 upgraded, 1 newly installed, 0 to remove and 40 not upgraded.\n",
767
+ "Need to get 2,129 kB of archives.\n",
768
+ "After this operation, 7,662 kB of additional disk space will be used.\n",
769
+ "Get:1 http://archive.ubuntu.com/ubuntu bionic/universe amd64 git-lfs amd64 2.3.4-1 [2,129 kB]\n",
770
+ "Fetched 2,129 kB in 1s (1,505 kB/s)\n",
771
+ "debconf: unable to initialize frontend: Dialog\n",
772
+ "debconf: (No usable dialog-like program is installed, so the dialog based frontend cannot be used. at /usr/share/perl5/Debconf/FrontEnd/Dialog.pm line 76, <> line 1.)\n",
773
+ "debconf: falling back to frontend: Readline\n",
774
+ "debconf: unable to initialize frontend: Readline\n",
775
+ "debconf: (This frontend requires a controlling tty.)\n",
776
+ "debconf: falling back to frontend: Teletype\n",
777
+ "dpkg-preconfigure: unable to re-open stdin: \n",
778
+ "Selecting previously unselected package git-lfs.\n",
779
+ "(Reading database ... 160837 files and directories currently installed.)\n",
780
+ "Preparing to unpack .../git-lfs_2.3.4-1_amd64.deb ...\n",
781
+ "Unpacking git-lfs (2.3.4-1) ...\n",
782
+ "Setting up git-lfs (2.3.4-1) ...\n",
783
+ "Processing triggers for man-db (2.8.3-2ubuntu0.1) ...\n",
784
+ "arguments passed: push_to_hf_hub\n",
785
+ "/content/summarization\n",
786
+ "dvc repro push_to_hf_hub\n",
787
+ "Stage 'download_data' didn't change, skipping\n",
788
+ "Stage 'process_data' didn't change, skipping\n",
789
+ "Stage 'train' didn't change, skipping\n",
790
+ "Running stage 'push_to_hf_hub':\n",
791
+ "> python src/models/hf_upload.py\n",
792
+ "2021-08-11 01:56:52.485609: I tensorflow/stream_executor/platform/default/dso_loader.cc:53] Successfully opened dynamic library libcudart.so.11.0\n",
793
+ "Global seed set to 42\n",
794
+ "Enter your HuggingFace username:gagan3012\n",
795
+ "Enter your HuggingFace token:\n",
796
+ "Check out your model at:\n",
797
+ "https://huggingface.co/gagan3012/summarsiation/commit/489bebf55d6f0f88e51ef19434d56a997d1c46c0\n",
798
+ "https://huggingface.co/gagan3012/summarsiation\n",
799
+ "Updating lock file 'dvc.lock'\n",
800
+ "\n",
801
+ "To track the changes with git, run:\n",
802
+ "\n",
803
+ "\tgit add dvc.lock\n",
804
+ "Use `dvc push` to send your updates to remote storage.\n",
805
+ "\u001b[0m"
806
+ ],
807
+ "name": "stdout"
808
+ }
809
+ ]
810
+ },
811
+ {
812
+ "cell_type": "code",
813
+ "metadata": {
814
+ "id": "co1DlH-o1tXW"
815
+ },
816
+ "source": [
817
+ ""
818
+ ],
819
+ "execution_count": null,
820
+ "outputs": []
821
+ }
822
+ ]
823
+ }