step 50000
Browse files- .gitattributes +2 -0
- codeparrot_training.py +4 -4
- log/debug_0.log +2 -2
- log/debug_1.log +1 -0
- log/debug_10.log +1 -0
- log/debug_11.log +1 -0
- log/debug_12.log +1 -0
- log/debug_13.log +1 -0
- log/debug_14.log +1 -0
- log/debug_15.log +1 -0
- log/debug_2.log +1 -0
- log/debug_3.log +1 -0
- log/debug_4.log +1 -0
- log/debug_5.log +1 -0
- log/debug_6.log +1 -0
- log/debug_7.log +1 -0
- log/debug_8.log +1 -0
- log/debug_9.log +1 -0
- pytorch_model.bin +1 -1
- runs/Jan14_15-50-40_leandro-16x-a100-b/1642175440.8731604/events.out.tfevents.1642175440.leandro-16x-a100-b.28548.1 +3 -0
- runs/Jan14_15-50-40_leandro-16x-a100-b/events.out.tfevents.1642175440.leandro-16x-a100-b.28548.0 +3 -0
- wandb/debug-internal.log +1 -1
- wandb/debug.log +1 -1
- wandb/latest-run +1 -1
- wandb/run-20220114_155039-1uxxfypf/files/conda-environment.yaml +0 -0
- wandb/run-20220114_155039-1uxxfypf/files/config.yaml +92 -0
- wandb/run-20220114_155039-1uxxfypf/files/output.log +0 -0
- wandb/run-20220114_155039-1uxxfypf/files/requirements.txt +81 -0
- wandb/run-20220114_155039-1uxxfypf/files/wandb-metadata.json +24 -0
- wandb/run-20220114_155039-1uxxfypf/files/wandb-summary.json +1 -0
- wandb/run-20220114_155039-1uxxfypf/logs/debug-internal.log +3 -0
- wandb/run-20220114_155039-1uxxfypf/logs/debug.log +23 -0
- wandb/run-20220114_155039-1uxxfypf/run-1uxxfypf.wandb +3 -0
.gitattributes
CHANGED
@@ -30,3 +30,5 @@ wandb/run-20211111_214446-3xgbgfj2/logs/debug-internal.log filter=lfs diff=lfs m
|
|
30 |
wandb/run-20211111_214446-3xgbgfj2/run-3xgbgfj2.wandb filter=lfs diff=lfs merge=lfs -text
|
31 |
log/debug_0.log filter=lfs diff=lfs merge=lfs -text
|
32 |
wandb/run-20211111_214446-3xgbgfj2/files/output.log filter=lfs diff=lfs merge=lfs -text
|
|
|
|
30 |
wandb/run-20211111_214446-3xgbgfj2/run-3xgbgfj2.wandb filter=lfs diff=lfs merge=lfs -text
|
31 |
log/debug_0.log filter=lfs diff=lfs merge=lfs -text
|
32 |
wandb/run-20211111_214446-3xgbgfj2/files/output.log filter=lfs diff=lfs merge=lfs -text
|
33 |
+
wandb/run-20220114_155039-1uxxfypf/logs/debug-internal.log filter=lfs diff=lfs merge=lfs -text
|
34 |
+
wandb/run-20220114_155039-1uxxfypf/run-1uxxfypf.wandb filter=lfs diff=lfs merge=lfs -text
|
codeparrot_training.py
CHANGED
@@ -66,8 +66,8 @@ def setup_logging(project_name):
|
|
66 |
tb_writer = SummaryWriter()
|
67 |
tb_writer.add_hparams(vars(args), {'0': 0})
|
68 |
logger.setLevel(logging.INFO)
|
69 |
-
datasets.utils.logging.
|
70 |
-
transformers.utils.logging.
|
71 |
else:
|
72 |
tb_writer = None
|
73 |
run_name = ''
|
@@ -129,7 +129,7 @@ config = {"train_batch_size": 2,
|
|
129 |
"valid_batch_size": 2,
|
130 |
"weight_decay": 0.1,
|
131 |
"shuffle_buffer": 1_000,
|
132 |
-
"learning_rate":
|
133 |
"lr_scheduler_type": "cosine",
|
134 |
"num_warmup_steps": 750,
|
135 |
"gradient_accumulation_steps": 16,
|
@@ -205,4 +205,4 @@ accelerator.wait_for_everyone()
|
|
205 |
unwrapped_model = accelerator.unwrap_model(model)
|
206 |
unwrapped_model.save_pretrained("./", save_function=accelerator.save)
|
207 |
if accelerator.is_main_process:
|
208 |
-
hf_repo.push_to_hub(commit_message=f'final model')
|
66 |
tb_writer = SummaryWriter()
|
67 |
tb_writer.add_hparams(vars(args), {'0': 0})
|
68 |
logger.setLevel(logging.INFO)
|
69 |
+
datasets.utils.logging.set_verbosity_warning()
|
70 |
+
transformers.utils.logging.set_verbosity_warning()
|
71 |
else:
|
72 |
tb_writer = None
|
73 |
run_name = ''
|
129 |
"valid_batch_size": 2,
|
130 |
"weight_decay": 0.1,
|
131 |
"shuffle_buffer": 1_000,
|
132 |
+
"learning_rate": 5e-5,
|
133 |
"lr_scheduler_type": "cosine",
|
134 |
"num_warmup_steps": 750,
|
135 |
"gradient_accumulation_steps": 16,
|
205 |
unwrapped_model = accelerator.unwrap_model(model)
|
206 |
unwrapped_model.save_pretrained("./", save_function=accelerator.save)
|
207 |
if accelerator.is_main_process:
|
208 |
+
hf_repo.push_to_hub(commit_message=f'final model')
|
log/debug_0.log
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0475c8ce3fa5b0111ead4e575b0d6b41ddf933c6bccf1374c46bf43f376e83f8
|
3 |
+
size 130284403
|
log/debug_1.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
log/debug_10.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
log/debug_11.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
log/debug_12.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
log/debug_13.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
log/debug_14.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
log/debug_15.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
log/debug_2.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
log/debug_3.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
log/debug_4.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
log/debug_5.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
log/debug_6.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
log/debug_7.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
log/debug_8.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
log/debug_9.log
CHANGED
@@ -1 +1,2 @@
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
|
1 |
11/11/2021 21:45:50 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
2 |
+
01/14/2022 15:51:31 - INFO - root - Reducer buckets have been rebuilt in this iteration.
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6169094681
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08a8edda980a53bb2df006ea4c632204bac679c41a49159443ef634983dcf03a
|
3 |
size 6169094681
|
runs/Jan14_15-50-40_leandro-16x-a100-b/1642175440.8731604/events.out.tfevents.1642175440.leandro-16x-a100-b.28548.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3500e6cd241c92592124e68388c45a088a9f122c0097e6f123e51f4d74173780
|
3 |
+
size 1438
|
runs/Jan14_15-50-40_leandro-16x-a100-b/events.out.tfevents.1642175440.leandro-16x-a100-b.28548.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18a3d7dfc1bd05e1de4b9b83f86f99705014175418c2c1d563ded9f0144b23bc
|
3 |
+
size 9134099
|
wandb/debug-internal.log
CHANGED
@@ -1 +1 @@
|
|
1 |
-
run-
|
1 |
+
run-20220114_155039-1uxxfypf/logs/debug-internal.log
|
wandb/debug.log
CHANGED
@@ -1 +1 @@
|
|
1 |
-
run-
|
1 |
+
run-20220114_155039-1uxxfypf/logs/debug.log
|
wandb/latest-run
CHANGED
@@ -1 +1 @@
|
|
1 |
-
run-
|
1 |
+
run-20220114_155039-1uxxfypf
|
wandb/run-20220114_155039-1uxxfypf/files/conda-environment.yaml
ADDED
File without changes
|
wandb/run-20220114_155039-1uxxfypf/files/config.yaml
ADDED
@@ -0,0 +1,92 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
wandb_version: 1
|
2 |
+
|
3 |
+
_wandb:
|
4 |
+
desc: null
|
5 |
+
value:
|
6 |
+
cli_version: 0.12.2
|
7 |
+
framework: huggingface
|
8 |
+
huggingface_version: 4.12.2
|
9 |
+
is_jupyter_run: false
|
10 |
+
is_kaggle_kernel: false
|
11 |
+
python_version: 3.8.11
|
12 |
+
start_time: 1642175439
|
13 |
+
t:
|
14 |
+
1:
|
15 |
+
- 1
|
16 |
+
- 11
|
17 |
+
3:
|
18 |
+
- 16
|
19 |
+
4: 3.8.11
|
20 |
+
5: 0.12.2
|
21 |
+
6: 4.12.2
|
22 |
+
8:
|
23 |
+
- 5
|
24 |
+
backend:
|
25 |
+
desc: null
|
26 |
+
value: nccl
|
27 |
+
deepspeed_plugin:
|
28 |
+
desc: null
|
29 |
+
value: None
|
30 |
+
device:
|
31 |
+
desc: null
|
32 |
+
value: cuda:0
|
33 |
+
distributed_type:
|
34 |
+
desc: null
|
35 |
+
value: DistributedType.MULTI_GPU
|
36 |
+
gradient_accumulation_steps:
|
37 |
+
desc: null
|
38 |
+
value: 16
|
39 |
+
gradient_checkpointing:
|
40 |
+
desc: null
|
41 |
+
value: true
|
42 |
+
initialized:
|
43 |
+
desc: null
|
44 |
+
value: 'True'
|
45 |
+
learning_rate:
|
46 |
+
desc: null
|
47 |
+
value: 5.0e-05
|
48 |
+
local_process_index:
|
49 |
+
desc: null
|
50 |
+
value: '0'
|
51 |
+
lr_scheduler_type:
|
52 |
+
desc: null
|
53 |
+
value: cosine
|
54 |
+
max_eval_steps:
|
55 |
+
desc: null
|
56 |
+
value: -1
|
57 |
+
max_train_steps:
|
58 |
+
desc: null
|
59 |
+
value: 50000
|
60 |
+
num_processes:
|
61 |
+
desc: null
|
62 |
+
value: '16'
|
63 |
+
num_warmup_steps:
|
64 |
+
desc: null
|
65 |
+
value: 750
|
66 |
+
process_index:
|
67 |
+
desc: null
|
68 |
+
value: '0'
|
69 |
+
save_checkpoint_steps:
|
70 |
+
desc: null
|
71 |
+
value: 50000
|
72 |
+
seed:
|
73 |
+
desc: null
|
74 |
+
value: 1
|
75 |
+
seq_length:
|
76 |
+
desc: null
|
77 |
+
value: 1024
|
78 |
+
shuffle_buffer:
|
79 |
+
desc: null
|
80 |
+
value: 1000
|
81 |
+
train_batch_size:
|
82 |
+
desc: null
|
83 |
+
value: 2
|
84 |
+
use_fp16:
|
85 |
+
desc: null
|
86 |
+
value: 'True'
|
87 |
+
valid_batch_size:
|
88 |
+
desc: null
|
89 |
+
value: 2
|
90 |
+
weight_decay:
|
91 |
+
desc: null
|
92 |
+
value: 0.1
|
wandb/run-20220114_155039-1uxxfypf/files/output.log
ADDED
The diff for this file is too large to render.
See raw diff
|
wandb/run-20220114_155039-1uxxfypf/files/requirements.txt
ADDED
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
absl-py==0.13.0
|
2 |
+
accelerate==0.5.1
|
3 |
+
aiohttp==3.7.4.post0
|
4 |
+
async-timeout==3.0.1
|
5 |
+
attrs==21.2.0
|
6 |
+
cachetools==4.2.2
|
7 |
+
certifi==2021.5.30
|
8 |
+
chardet==4.0.0
|
9 |
+
charset-normalizer==2.0.5
|
10 |
+
click==8.0.1
|
11 |
+
configparser==5.0.2
|
12 |
+
datasets==1.13.0
|
13 |
+
deepspeed==0.5.2
|
14 |
+
dill==0.3.4
|
15 |
+
docker-pycreds==0.4.0
|
16 |
+
filelock==3.0.12
|
17 |
+
fsspec==2021.8.1
|
18 |
+
gitdb==4.0.7
|
19 |
+
gitpython==3.1.18
|
20 |
+
google-auth-oauthlib==0.4.6
|
21 |
+
google-auth==1.35.0
|
22 |
+
grpcio==1.40.0
|
23 |
+
huggingface-hub==0.0.19
|
24 |
+
idna==3.2
|
25 |
+
joblib==1.0.1
|
26 |
+
markdown==3.3.4
|
27 |
+
mkl-fft==1.3.0
|
28 |
+
mkl-random==1.2.2
|
29 |
+
mkl-service==2.4.0
|
30 |
+
multidict==5.1.0
|
31 |
+
multiprocess==0.70.12.2
|
32 |
+
ninja==1.10.2
|
33 |
+
numpy==1.20.3
|
34 |
+
oauthlib==3.1.1
|
35 |
+
olefile==0.46
|
36 |
+
packaging==21.0
|
37 |
+
pandas==1.3.3
|
38 |
+
pathtools==0.1.2
|
39 |
+
pillow==8.3.1
|
40 |
+
pip==21.0.1
|
41 |
+
promise==2.3
|
42 |
+
protobuf==3.18.0
|
43 |
+
psutil==5.8.0
|
44 |
+
pyarrow==5.0.0
|
45 |
+
pyasn1-modules==0.2.8
|
46 |
+
pyasn1==0.4.8
|
47 |
+
pyparsing==2.4.7
|
48 |
+
python-dateutil==2.8.2
|
49 |
+
pytz==2021.1
|
50 |
+
pyyaml==5.4.1
|
51 |
+
regex==2021.8.28
|
52 |
+
requests-oauthlib==1.3.0
|
53 |
+
requests==2.26.0
|
54 |
+
rsa==4.7.2
|
55 |
+
sacremoses==0.0.45
|
56 |
+
sentry-sdk==1.3.1
|
57 |
+
setuptools==52.0.0.post20210125
|
58 |
+
shortuuid==1.0.1
|
59 |
+
six==1.16.0
|
60 |
+
smmap==4.0.0
|
61 |
+
subprocess32==3.5.4
|
62 |
+
tensorboard-data-server==0.6.1
|
63 |
+
tensorboard-plugin-wit==1.8.0
|
64 |
+
tensorboard==2.6.0
|
65 |
+
tensorboardx==1.8
|
66 |
+
termcolor==1.1.0
|
67 |
+
tokenizers==0.10.3
|
68 |
+
torch==1.9.0
|
69 |
+
torchaudio==0.9.0a0+33b2469
|
70 |
+
torchvision==0.10.0
|
71 |
+
tqdm==4.62.2
|
72 |
+
transformers==4.12.2
|
73 |
+
triton==1.0.0
|
74 |
+
typing-extensions==3.10.0.0
|
75 |
+
urllib3==1.26.6
|
76 |
+
wandb==0.12.2
|
77 |
+
werkzeug==2.0.1
|
78 |
+
wheel==0.37.0
|
79 |
+
xxhash==2.0.2
|
80 |
+
yarl==1.6.3
|
81 |
+
yaspin==2.1.0
|
wandb/run-20220114_155039-1uxxfypf/files/wandb-metadata.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"os": "Linux-4.19.0-18-cloud-amd64-x86_64-with-glibc2.17",
|
3 |
+
"python": "3.8.11",
|
4 |
+
"heartbeatAt": "2022-01-14T15:50:40.774787",
|
5 |
+
"startedAt": "2022-01-14T15:50:39.945346",
|
6 |
+
"docker": null,
|
7 |
+
"gpu": "A100-SXM4-40GB",
|
8 |
+
"gpu_count": 16,
|
9 |
+
"cpu_count": 96,
|
10 |
+
"cuda": null,
|
11 |
+
"args": [],
|
12 |
+
"state": "running",
|
13 |
+
"program": "codeparrot_training.py",
|
14 |
+
"codePath": "codeparrot_training.py",
|
15 |
+
"git": {
|
16 |
+
"remote": "https://huggingface.co/lvwerra/codeparrot",
|
17 |
+
"commit": "23d07ce28c7ec45049bfe92d9e1b74c0acba62f8"
|
18 |
+
},
|
19 |
+
"email": "leandro.vonwerra@gmail.com",
|
20 |
+
"root": "/home/leandro/codeparrot",
|
21 |
+
"host": "leandro-16x-a100-b",
|
22 |
+
"username": "leandro",
|
23 |
+
"executable": "/home/leandro/miniconda3/envs/codeparrot2/bin/python"
|
24 |
+
}
|
wandb/run-20220114_155039-1uxxfypf/files/wandb-summary.json
ADDED
@@ -0,0 +1 @@
|
|
|
1 |
+
{"lr": 4.9713892916952546e-05, "samples": 1600000, "steps": 3124, "loss/train": 1.10879647731781, "_runtime": 40015, "_timestamp": 1642215454, "_step": 50000, "loss/eval": 1.0396919250488281, "perplexity": 2.828345537185669}
|
wandb/run-20220114_155039-1uxxfypf/logs/debug-internal.log
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7c80e994541bf475850a8692ca0f54fc2e8d575f234abc757fb6353bbe84732
|
3 |
+
size 26892666
|
wandb/run-20220114_155039-1uxxfypf/logs/debug.log
ADDED
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
2022-01-14 15:50:39,947 INFO MainThread:28548 [wandb_setup.py:_flush():69] setting env: {}
|
2 |
+
2022-01-14 15:50:39,947 INFO MainThread:28548 [wandb_setup.py:_flush():69] setting login settings: {}
|
3 |
+
2022-01-14 15:50:39,947 INFO MainThread:28548 [wandb_init.py:_log_setup():348] Logging user logs to /home/leandro/codeparrot/wandb/run-20220114_155039-1uxxfypf/logs/debug.log
|
4 |
+
2022-01-14 15:50:39,947 INFO MainThread:28548 [wandb_init.py:_log_setup():349] Logging internal logs to /home/leandro/codeparrot/wandb/run-20220114_155039-1uxxfypf/logs/debug-internal.log
|
5 |
+
2022-01-14 15:50:39,947 INFO MainThread:28548 [wandb_init.py:init():381] calling init triggers
|
6 |
+
2022-01-14 15:50:39,948 INFO MainThread:28548 [wandb_init.py:init():386] wandb.init called with sweep_config: {}
|
7 |
+
config: {'train_batch_size': 2, 'valid_batch_size': 2, 'weight_decay': 0.1, 'shuffle_buffer': 1000, 'learning_rate': 5e-05, 'lr_scheduler_type': 'cosine', 'num_warmup_steps': 750, 'gradient_accumulation_steps': 16, 'gradient_checkpointing': True, 'max_train_steps': 50000, 'max_eval_steps': -1, 'seq_length': 1024, 'seed': 1, 'save_checkpoint_steps': 50000, 'backend': 'nccl', 'deepspeed_plugin': 'None', 'distributed_type': 'DistributedType.MULTI_GPU', 'num_processes': '16', 'process_index': '0', 'local_process_index': '0', 'device': 'cuda:0', 'use_fp16': 'True', 'initialized': 'True'}
|
8 |
+
2022-01-14 15:50:39,948 INFO MainThread:28548 [wandb_init.py:init():430] starting backend
|
9 |
+
2022-01-14 15:50:39,948 INFO MainThread:28548 [backend.py:_multiprocessing_setup():70] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
|
10 |
+
2022-01-14 15:50:39,961 INFO MainThread:28548 [backend.py:ensure_launched():135] starting backend process...
|
11 |
+
2022-01-14 15:50:39,970 INFO MainThread:28548 [backend.py:ensure_launched():139] started backend process with pid: 28880
|
12 |
+
2022-01-14 15:50:39,972 INFO MainThread:28548 [wandb_init.py:init():435] backend started and connected
|
13 |
+
2022-01-14 15:50:39,977 INFO MainThread:28548 [wandb_init.py:init():494] updated telemetry
|
14 |
+
2022-01-14 15:50:39,978 INFO MainThread:28548 [wandb_init.py:init():517] communicating current version
|
15 |
+
2022-01-14 15:50:40,637 INFO MainThread:28548 [wandb_init.py:init():522] got version response upgrade_message: "wandb version 0.12.9 is available! To upgrade, please run:\n $ pip install wandb --upgrade"
|
16 |
+
|
17 |
+
2022-01-14 15:50:40,637 INFO MainThread:28548 [wandb_init.py:init():530] communicating run to backend with 30 second timeout
|
18 |
+
2022-01-14 15:50:40,721 INFO MainThread:28548 [wandb_init.py:init():557] starting run threads in backend
|
19 |
+
2022-01-14 15:50:40,860 INFO MainThread:28548 [wandb_run.py:_console_start():1605] atexit reg
|
20 |
+
2022-01-14 15:50:40,861 INFO MainThread:28548 [wandb_run.py:_redirect():1479] redirect: SettingsConsole.REDIRECT
|
21 |
+
2022-01-14 15:50:40,861 INFO MainThread:28548 [wandb_run.py:_redirect():1484] Redirecting console.
|
22 |
+
2022-01-14 15:50:40,865 INFO MainThread:28548 [wandb_run.py:_redirect():1540] Redirects installed.
|
23 |
+
2022-01-14 15:50:40,865 INFO MainThread:28548 [wandb_init.py:init():582] run started, returning control to user process
|
wandb/run-20220114_155039-1uxxfypf/run-1uxxfypf.wandb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48ff5908577eae0523c5d4692a24039eb2f6ee01c42bdc2f1d881bf030f84bf0
|
3 |
+
size 19776992
|