Femboyuwu2000 committed on Apr 11

Commit

f4089ce

•

1 Parent(s): 368b66b

bloomz_bl_story

Browse files

Files changed (21) hide show

.gitattributes +1 -0
README.md +4 -4
adapter_config.json +4 -6
adapter_model.safetensors +2 -2
runs/Apr11_03-48-59_321ddc84c049/events.out.tfevents.1712807923.321ddc84c049.145.0 +3 -0
special_tokens_map.json +15 -4
spiece.model +3 -0
tokenizer.json +0 -0
tokenizer_config.json +27 -10
training_args.bin +1 -1
wandb/debug-internal.log +108 -152
wandb/debug.log +30 -30
wandb/run-20240411_035909-21esl9hl/files/conda-environment.yaml +0 -0
wandb/run-20240411_035909-21esl9hl/files/config.yaml +690 -0
wandb/run-20240411_035909-21esl9hl/files/output.log +103 -0
wandb/run-20240411_035909-21esl9hl/files/requirements.txt +864 -0
wandb/run-20240411_035909-21esl9hl/files/wandb-metadata.json +66 -0
wandb/run-20240411_035909-21esl9hl/files/wandb-summary.json +1 -0
wandb/run-20240411_035909-21esl9hl/logs/debug-internal.log +118 -0
wandb/run-20240411_035909-21esl9hl/logs/debug.log +32 -0
wandb/run-20240411_035909-21esl9hl/run-21esl9hl.wandb +0 -0

.gitattributes CHANGED Viewed

@@ -36,3 +36,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 wandb/run-20240408_203054-ldiuneeg/run-ldiuneeg.wandb filter=lfs diff=lfs merge=lfs -text
 wandb/run-20240410_010250-ft4a6i5j/run-ft4a6i5j.wandb filter=lfs diff=lfs merge=lfs -text
 wandb/run-20240410_115017-r9p6sok2/run-r9p6sok2.wandb filter=lfs diff=lfs merge=lfs -text

 wandb/run-20240408_203054-ldiuneeg/run-ldiuneeg.wandb filter=lfs diff=lfs merge=lfs -text
 wandb/run-20240410_010250-ft4a6i5j/run-ft4a6i5j.wandb filter=lfs diff=lfs merge=lfs -text
 wandb/run-20240410_115017-r9p6sok2/run-r9p6sok2.wandb filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

README.md CHANGED Viewed

@@ -1,11 +1,11 @@
 ---
-license: mit
 library_name: peft
 tags:
 - trl
 - sft
 - generated_from_trainer
-base_model: openai-community/gpt2-large
 model-index:
 - name: working
   results: []
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
 # working
-This model is a fine-tuned version of [openai-community/gpt2-large](https://huggingface.co/openai-community/gpt2-large) on an unknown dataset.
 ## Model description
@@ -42,7 +42,7 @@ The following hyperparameters were used during training:
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
 - lr_scheduler_warmup_ratio: 0.03
-- training_steps: 20
 ### Training results

 ---
+license: bigscience-bloom-rail-1.0
 library_name: peft
 tags:
 - trl
 - sft
 - generated_from_trainer
+base_model: bigscience/bloomz-560m
 model-index:
 - name: working
   results: []
 # working
+This model is a fine-tuned version of [bigscience/bloomz-560m](https://huggingface.co/bigscience/bloomz-560m) on an unknown dataset.
 ## Model description
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
 - lr_scheduler_warmup_ratio: 0.03
+- training_steps: 10
 ### Training results

adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "openai-community/gpt2-large",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
@@ -20,11 +20,9 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "c_fc",
-    "c_attn",
-    "wte",
-    "c_proj",
-    "lm_head"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": "bigscience/bloomz-560m",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "lm_head",
+    "query_key_value",
+    "dense_h_to_4h"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e89a7e068c1b8ca512d8f84c288b20473c3e33b72af5e87dbdc4880c81fbaec5
-size 541561408

 version https://git-lfs.github.com/spec/v1
+oid sha256:9baf0d7e0bee813113ef40ed93ff8433a426745af90937aabc260a737c8f5277
+size 1042757704

runs/Apr11_03-48-59_321ddc84c049/events.out.tfevents.1712807923.321ddc84c049.145.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fd9ae83ebfcb3f35de03b0cb64494734931fec3a0f8dbe90d9f7ad0f502ddea5
+size 15841

special_tokens_map.json CHANGED Viewed

@@ -1,6 +1,17 @@
 {
-  "bos_token": "<|endoftext|>",
-  "eos_token": "<|endoftext|>",
-  "pad_token": "<|endoftext|>",
-  "unk_token": "<|endoftext|>"
 }

 {
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "</s>",
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
 }

spiece.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ef78f86560d809067d12bac6c09f19a462cb3af3f54d2b8acbba26e1433125d6
+size 4309802

tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json CHANGED Viewed

@@ -1,22 +1,39 @@
 {
-  "add_prefix_space": false,
   "added_tokens_decoder": {
-    "50256": {
-      "content": "<|endoftext|>",
       "lstrip": false,
-      "normalized": true,
       "rstrip": false,
       "single_word": false,
       "special": true
     }
   },
-  "bos_token": "<|endoftext|>",
   "clean_up_tokenization_spaces": true,
-  "eos_token": "<|endoftext|>",
   "max_length": 1024,
-  "model_max_length": 1024,
-  "pad_token": "<|endoftext|>",
-  "tokenizer_class": "GPT2Tokenizer",
   "truncation": true,
-  "unk_token": "<|endoftext|>"
 }

 {
   "added_tokens_decoder": {
+    "0": {
+      "content": "<pad>",
       "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
     }
   },
+  "additional_special_tokens": [],
   "clean_up_tokenization_spaces": true,
+  "eos_token": "</s>",
+  "extra_ids": 0,
   "max_length": 1024,
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "</s>",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "T5Tokenizer",
   "truncation": true,
+  "unk_token": "<unk>"
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d336504ff1b5fa68adcdc85a42fecf652565e8aad52350e3bded9aa454938008
 size 4920

 version https://git-lfs.github.com/spec/v1
+oid sha256:9fcb5d40d27446b473f3cf6a16217747341cc71590de85e4a2a9001a3be0bfca
 size 4920

wandb/debug-internal.log CHANGED Viewed

@@ -1,32 +1,32 @@
-2024-04-11 01:01:03,983 INFO    StreamThr :138 [internal.py:wandb_internal():86] W&B internal server running at pid: 138, started at: 2024-04-11 01:01:03.982415
-2024-04-11 01:01:03,984 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status
-2024-04-11 01:01:04,351 INFO    WriterThread:138 [datastore.py:open_for_write():87] open: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/run-4b3fzolv.wandb
-2024-04-11 01:01:04,352 DEBUG   SenderThread:138 [sender.py:send():379] send: header
-2024-04-11 01:01:04,355 DEBUG   SenderThread:138 [sender.py:send():379] send: run
-2024-04-11 01:01:04,503 INFO    SenderThread:138 [dir_watcher.py:__init__():211] watching files in: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/files
-2024-04-11 01:01:04,503 INFO    SenderThread:138 [sender.py:_start_run_threads():1124] run started: 4b3fzolv with start time 1712797263.984466
-2024-04-11 01:01:04,511 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: check_version
-2024-04-11 01:01:04,511 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: check_version
-2024-04-11 01:01:04,599 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: run_start
-2024-04-11 01:01:04,610 DEBUG   HandlerThread:138 [system_info.py:__init__():26] System info init
-2024-04-11 01:01:04,610 DEBUG   HandlerThread:138 [system_info.py:__init__():41] System info init done
-2024-04-11 01:01:04,610 INFO    HandlerThread:138 [system_monitor.py:start():194] Starting system monitor
-2024-04-11 01:01:04,610 INFO    SystemMonitor:138 [system_monitor.py:_start():158] Starting system asset monitoring threads
-2024-04-11 01:01:04,610 INFO    HandlerThread:138 [system_monitor.py:probe():214] Collecting system info
-2024-04-11 01:01:04,611 INFO    SystemMonitor:138 [interfaces.py:start():190] Started cpu monitoring
-2024-04-11 01:01:04,611 INFO    SystemMonitor:138 [interfaces.py:start():190] Started disk monitoring
-2024-04-11 01:01:04,612 INFO    SystemMonitor:138 [interfaces.py:start():190] Started gpu monitoring
-2024-04-11 01:01:04,613 INFO    SystemMonitor:138 [interfaces.py:start():190] Started memory monitoring
-2024-04-11 01:01:04,614 INFO    SystemMonitor:138 [interfaces.py:start():190] Started network monitoring
-2024-04-11 01:01:04,623 DEBUG   HandlerThread:138 [system_info.py:probe():150] Probing system
-2024-04-11 01:01:04,625 DEBUG   HandlerThread:138 [gitlib.py:_init_repo():56] git repository is invalid
-2024-04-11 01:01:04,625 DEBUG   HandlerThread:138 [system_info.py:probe():198] Probing system done
-2024-04-11 01:01:04,626 DEBUG   HandlerThread:138 [system_monitor.py:probe():223] {'os': 'Linux-5.15.133+-x86_64-with-glibc2.31', 'python': '3.10.13', 'heartbeatAt': '2024-04-11T01:01:04.623823', 'startedAt': '2024-04-11T01:01:03.976173', 'docker': None, 'cuda': None, 'args': (), 'state': 'running', 'program': 'kaggle.ipynb', 'codePathLocal': None, 'root': '/kaggle/working', 'host': 'c072b7c9e487', 'username': 'root', 'executable': '/opt/conda/bin/python3.10', 'cpu_count': 2, 'cpu_count_logical': 4, 'cpu_freq': {'current': 2000.188, 'min': 0.0, 'max': 0.0}, 'cpu_freq_per_core': [{'current': 2000.188, 'min': 0.0, 'max': 0.0}, {'current': 2000.188, 'min': 0.0, 'max': 0.0}, {'current': 2000.188, 'min': 0.0, 'max': 0.0}, {'current': 2000.188, 'min': 0.0, 'max': 0.0}], 'disk': {'/': {'total': 8062.387607574463, 'used': 5566.689571380615}}, 'gpu': 'Tesla T4', 'gpu_count': 2, 'gpu_devices': [{'name': 'Tesla T4', 'memory_total': 16106127360}, {'name': 'Tesla T4', 'memory_total': 16106127360}], 'memory': {'total': 31.357559204101562}}
-2024-04-11 01:01:04,626 INFO    HandlerThread:138 [system_monitor.py:probe():224] Finished collecting system info
-2024-04-11 01:01:04,626 INFO    HandlerThread:138 [system_monitor.py:probe():227] Publishing system info
-2024-04-11 01:01:04,626 DEBUG   HandlerThread:138 [system_info.py:_save_conda():207] Saving list of conda packages installed into the current environment
-2024-04-11 01:01:05,505 INFO    Thread-12 :138 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/files/conda-environment.yaml
-2024-04-11 01:01:19,640 ERROR   HandlerThread:138 [system_info.py:_save_conda():221] Error saving conda packages: Command '['conda', 'env', 'export']' timed out after 15 seconds
 Traceback (most recent call last):
   File "/opt/conda/lib/python3.10/site-packages/wandb/sdk/internal/system/system_info.py", line 214, in _save_conda
     subprocess.call(
@@ -37,126 +37,82 @@ Traceback (most recent call last):
   File "/opt/conda/lib/python3.10/subprocess.py", line 1951, in _wait
     raise TimeoutExpired(self.args, timeout)
 subprocess.TimeoutExpired: Command '['conda', 'env', 'export']' timed out after 15 seconds
-2024-04-11 01:01:19,643 DEBUG   HandlerThread:138 [system_info.py:_save_conda():222] Saving conda packages done
-2024-04-11 01:01:19,644 INFO    HandlerThread:138 [system_monitor.py:probe():229] Finished publishing system info
-2024-04-11 01:01:19,652 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:01:19,652 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: keepalive
-2024-04-11 01:01:19,652 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:01:19,653 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: keepalive
-2024-04-11 01:01:19,653 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:01:19,653 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: keepalive
-2024-04-11 01:01:19,653 DEBUG   SenderThread:138 [sender.py:send():379] send: files
-2024-04-11 01:01:19,653 INFO    SenderThread:138 [sender.py:_save_file():1390] saving file wandb-metadata.json with policy now
-2024-04-11 01:01:19,933 INFO    wandb-upload_0:138 [upload_job.py:push():131] Uploaded file /tmp/tmpiqqv1dwfwandb/3d55vshp-wandb-metadata.json
-2024-04-11 01:01:20,508 INFO    Thread-12 :138 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/files/wandb-metadata.json
-2024-04-11 01:01:20,599 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: python_packages
-2024-04-11 01:01:20,599 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: python_packages
-2024-04-11 01:01:20,602 DEBUG   SenderThread:138 [sender.py:send():379] send: telemetry
-2024-04-11 01:01:20,613 DEBUG   SenderThread:138 [sender.py:send():379] send: config
-2024-04-11 01:01:20,615 DEBUG   SenderThread:138 [sender.py:send():379] send: metric
-2024-04-11 01:01:20,615 DEBUG   SenderThread:138 [sender.py:send():379] send: telemetry
-2024-04-11 01:01:20,615 DEBUG   SenderThread:138 [sender.py:send():379] send: metric
-2024-04-11 01:01:20,615 WARNING SenderThread:138 [sender.py:send_metric():1341] Seen metric with glob (shouldn't happen)
-2024-04-11 01:01:20,616 DEBUG   SenderThread:138 [sender.py:send():379] send: telemetry
-2024-04-11 01:01:20,616 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: stop_status
-2024-04-11 01:01:20,616 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: internal_messages
-2024-04-11 01:01:20,617 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: stop_status
-2024-04-11 01:01:21,508 INFO    Thread-12 :138 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/files/requirements.txt
-2024-04-11 01:01:21,509 INFO    Thread-12 :138 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/files/output.log
-2024-04-11 01:01:23,509 INFO    Thread-12 :138 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/files/output.log
-2024-04-11 01:01:25,510 INFO    Thread-12 :138 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/files/output.log
-2024-04-11 01:01:25,513 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:01:27,511 INFO    Thread-12 :138 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/files/output.log
-2024-04-11 01:01:30,790 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:01:35,602 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: internal_messages
-2024-04-11 01:01:35,603 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: stop_status
-2024-04-11 01:01:35,604 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: stop_status
-2024-04-11 01:01:36,648 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:01:37,515 INFO    Thread-12 :138 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/files/config.yaml
-2024-04-11 01:01:41,766 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:01:46,767 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:01:50,600 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: stop_status
-2024-04-11 01:01:50,601 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: stop_status
-2024-04-11 01:01:50,640 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: internal_messages
-2024-04-11 01:01:52,707 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:01:57,708 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:02:02,709 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:02:04,614 DEBUG   SystemMonitor:138 [system_monitor.py:_start():172] Starting system metrics aggregation loop
-2024-04-11 01:02:04,616 DEBUG   SenderThread:138 [sender.py:send():379] send: stats
-2024-04-11 01:02:05,600 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: stop_status
-2024-04-11 01:02:05,601 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: stop_status
-2024-04-11 01:02:05,641 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: internal_messages
-2024-04-11 01:02:08,651 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:02:13,651 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:02:18,652 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:02:20,600 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: stop_status
-2024-04-11 01:02:20,601 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: stop_status
-2024-04-11 01:02:20,641 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: internal_messages
-2024-04-11 01:02:23,671 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:02:28,672 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:02:33,673 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:02:34,617 DEBUG   SenderThread:138 [sender.py:send():379] send: stats
-2024-04-11 01:02:35,601 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: stop_status
-2024-04-11 01:02:35,601 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: stop_status
-2024-04-11 01:02:35,641 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: internal_messages
-2024-04-11 01:02:39,669 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:02:44,669 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:02:49,670 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:02:50,601 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: stop_status
-2024-04-11 01:02:50,601 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: stop_status
-2024-04-11 01:02:50,641 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: internal_messages
-2024-04-11 01:02:54,683 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:02:59,684 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:03:04,618 DEBUG   SenderThread:138 [sender.py:send():379] send: stats
-2024-04-11 01:03:05,601 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: stop_status
-2024-04-11 01:03:05,601 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: stop_status
-2024-04-11 01:03:05,641 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: internal_messages
-2024-04-11 01:03:05,668 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:03:10,669 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:03:15,670 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:03:20,601 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: stop_status
-2024-04-11 01:03:20,602 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: stop_status
-2024-04-11 01:03:20,641 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: internal_messages
-2024-04-11 01:03:21,658 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:03:26,659 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:03:31,660 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:03:34,619 DEBUG   SenderThread:138 [sender.py:send():379] send: stats
-2024-04-11 01:03:35,601 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: stop_status
-2024-04-11 01:03:35,602 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: stop_status
-2024-04-11 01:03:35,642 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: internal_messages
-2024-04-11 01:03:36,661 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:03:37,017 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: partial_history
-2024-04-11 01:03:37,019 DEBUG   SenderThread:138 [sender.py:send():379] send: metric
-2024-04-11 01:03:37,019 DEBUG   SenderThread:138 [sender.py:send():379] send: metric
-2024-04-11 01:03:37,019 DEBUG   SenderThread:138 [sender.py:send():379] send: metric
-2024-04-11 01:03:37,020 DEBUG   SenderThread:138 [sender.py:send():379] send: metric
-2024-04-11 01:03:37,020 DEBUG   SenderThread:138 [sender.py:send():379] send: history
-2024-04-11 01:03:37,020 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: summary_record
-2024-04-11 01:03:37,020 INFO    SenderThread:138 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
-2024-04-11 01:03:37,559 INFO    Thread-12 :138 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/files/wandb-summary.json
-2024-04-11 01:03:38,738 DEBUG   SenderThread:138 [sender.py:send():379] send: telemetry
-2024-04-11 01:03:38,738 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: summary_record
-2024-04-11 01:03:38,739 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: partial_history
-2024-04-11 01:03:38,741 INFO    SenderThread:138 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
-2024-04-11 01:03:38,741 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: summary_record
-2024-04-11 01:03:38,741 INFO    SenderThread:138 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
-2024-04-11 01:03:38,742 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: summary_record
-2024-04-11 01:03:38,742 INFO    SenderThread:138 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
-2024-04-11 01:03:38,742 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: summary_record
-2024-04-11 01:03:38,743 INFO    SenderThread:138 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
-2024-04-11 01:03:38,743 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: summary_record
-2024-04-11 01:03:38,743 INFO    SenderThread:138 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
-2024-04-11 01:03:38,744 DEBUG   SenderThread:138 [sender.py:send():379] send: history
-2024-04-11 01:03:38,744 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: summary_record
-2024-04-11 01:03:38,744 INFO    SenderThread:138 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
-2024-04-11 01:03:39,559 INFO    Thread-12 :138 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/files/wandb-summary.json
-2024-04-11 01:03:39,560 INFO    Thread-12 :138 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/files/output.log
-2024-04-11 01:03:41,560 INFO    Thread-12 :138 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/files/output.log
-2024-04-11 01:03:41,871 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:03:42,561 INFO    Thread-12 :138 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_010103-4b3fzolv/files/config.yaml
-2024-04-11 01:03:46,983 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:03:50,601 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: stop_status
-2024-04-11 01:03:50,602 DEBUG   SenderThread:138 [sender.py:send_request():406] send_request: stop_status
-2024-04-11 01:03:50,604 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: internal_messages
-2024-04-11 01:03:52,705 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report
-2024-04-11 01:03:57,706 DEBUG   HandlerThread:138 [handler.py:handle_request():146] handle_request: status_report

+2024-04-11 03:59:09,940 INFO    StreamThr :191 [internal.py:wandb_internal():86] W&B internal server running at pid: 191, started at: 2024-04-11 03:59:09.939664
+2024-04-11 03:59:09,941 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status
+2024-04-11 03:59:10,363 INFO    WriterThread:191 [datastore.py:open_for_write():87] open: /kaggle/working/wandb/run-20240411_035909-21esl9hl/run-21esl9hl.wandb
+2024-04-11 03:59:10,364 DEBUG   SenderThread:191 [sender.py:send():379] send: header
+2024-04-11 03:59:10,367 DEBUG   SenderThread:191 [sender.py:send():379] send: run
+2024-04-11 03:59:10,517 INFO    SenderThread:191 [dir_watcher.py:__init__():211] watching files in: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files
+2024-04-11 03:59:10,517 INFO    SenderThread:191 [sender.py:_start_run_threads():1124] run started: 21esl9hl with start time 1712807949.940735
+2024-04-11 03:59:10,526 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: check_version
+2024-04-11 03:59:10,526 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: check_version
+2024-04-11 03:59:10,621 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: run_start
+2024-04-11 03:59:10,635 DEBUG   HandlerThread:191 [system_info.py:__init__():26] System info init
+2024-04-11 03:59:10,635 DEBUG   HandlerThread:191 [system_info.py:__init__():41] System info init done
+2024-04-11 03:59:10,635 INFO    HandlerThread:191 [system_monitor.py:start():194] Starting system monitor
+2024-04-11 03:59:10,635 INFO    SystemMonitor:191 [system_monitor.py:_start():158] Starting system asset monitoring threads
+2024-04-11 03:59:10,635 INFO    HandlerThread:191 [system_monitor.py:probe():214] Collecting system info
+2024-04-11 03:59:10,639 INFO    SystemMonitor:191 [interfaces.py:start():190] Started cpu monitoring
+2024-04-11 03:59:10,640 INFO    SystemMonitor:191 [interfaces.py:start():190] Started disk monitoring
+2024-04-11 03:59:10,644 INFO    SystemMonitor:191 [interfaces.py:start():190] Started gpu monitoring
+2024-04-11 03:59:10,644 INFO    SystemMonitor:191 [interfaces.py:start():190] Started memory monitoring
+2024-04-11 03:59:10,645 INFO    SystemMonitor:191 [interfaces.py:start():190] Started network monitoring
+2024-04-11 03:59:10,650 DEBUG   HandlerThread:191 [system_info.py:probe():150] Probing system
+2024-04-11 03:59:10,652 DEBUG   HandlerThread:191 [gitlib.py:_init_repo():56] git repository is invalid
+2024-04-11 03:59:10,652 DEBUG   HandlerThread:191 [system_info.py:probe():198] Probing system done
+2024-04-11 03:59:10,652 DEBUG   HandlerThread:191 [system_monitor.py:probe():223] {'os': 'Linux-5.15.133+-x86_64-with-glibc2.31', 'python': '3.10.13', 'heartbeatAt': '2024-04-11T03:59:10.650560', 'startedAt': '2024-04-11T03:59:09.933024', 'docker': None, 'cuda': None, 'args': (), 'state': 'running', 'program': 'kaggle.ipynb', 'codePathLocal': None, 'root': '/kaggle/working', 'host': '321ddc84c049', 'username': 'root', 'executable': '/opt/conda/bin/python3.10', 'cpu_count': 2, 'cpu_count_logical': 4, 'cpu_freq': {'current': 2000.19, 'min': 0.0, 'max': 0.0}, 'cpu_freq_per_core': [{'current': 2000.19, 'min': 0.0, 'max': 0.0}, {'current': 2000.19, 'min': 0.0, 'max': 0.0}, {'current': 2000.19, 'min': 0.0, 'max': 0.0}, {'current': 2000.19, 'min': 0.0, 'max': 0.0}], 'disk': {'/': {'total': 8062.387607574463, 'used': 5566.961940765381}}, 'gpu': 'Tesla T4', 'gpu_count': 2, 'gpu_devices': [{'name': 'Tesla T4', 'memory_total': 16106127360}, {'name': 'Tesla T4', 'memory_total': 16106127360}], 'memory': {'total': 31.357559204101562}}
+2024-04-11 03:59:10,653 INFO    HandlerThread:191 [system_monitor.py:probe():224] Finished collecting system info
+2024-04-11 03:59:10,653 INFO    HandlerThread:191 [system_monitor.py:probe():227] Publishing system info
+2024-04-11 03:59:10,653 DEBUG   HandlerThread:191 [system_info.py:_save_conda():207] Saving list of conda packages installed into the current environment
+2024-04-11 03:59:11,520 INFO    Thread-12 :191 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/conda-environment.yaml
+2024-04-11 03:59:25,667 ERROR   HandlerThread:191 [system_info.py:_save_conda():221] Error saving conda packages: Command '['conda', 'env', 'export']' timed out after 15 seconds
 Traceback (most recent call last):
   File "/opt/conda/lib/python3.10/site-packages/wandb/sdk/internal/system/system_info.py", line 214, in _save_conda
     subprocess.call(
   File "/opt/conda/lib/python3.10/subprocess.py", line 1951, in _wait
     raise TimeoutExpired(self.args, timeout)
 subprocess.TimeoutExpired: Command '['conda', 'env', 'export']' timed out after 15 seconds
+2024-04-11 03:59:25,670 DEBUG   HandlerThread:191 [system_info.py:_save_conda():222] Saving conda packages done
+2024-04-11 03:59:25,671 INFO    HandlerThread:191 [system_monitor.py:probe():229] Finished publishing system info
+2024-04-11 03:59:25,678 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:25,678 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: keepalive
+2024-04-11 03:59:25,679 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:25,679 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: keepalive
+2024-04-11 03:59:25,679 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:25,679 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: keepalive
+2024-04-11 03:59:25,679 DEBUG   SenderThread:191 [sender.py:send():379] send: files
+2024-04-11 03:59:25,680 INFO    SenderThread:191 [sender.py:_save_file():1390] saving file wandb-metadata.json with policy now
+2024-04-11 03:59:25,883 INFO    wandb-upload_0:191 [upload_job.py:push():131] Uploaded file /tmp/tmpgmb8demxwandb/zh9coxtl-wandb-metadata.json
+2024-04-11 03:59:26,522 INFO    Thread-12 :191 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/wandb-metadata.json
+2024-04-11 03:59:26,714 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: python_packages
+2024-04-11 03:59:26,714 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: python_packages
+2024-04-11 03:59:26,717 DEBUG   SenderThread:191 [sender.py:send():379] send: telemetry
+2024-04-11 03:59:26,727 DEBUG   SenderThread:191 [sender.py:send():379] send: config
+2024-04-11 03:59:26,728 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: internal_messages
+2024-04-11 03:59:26,729 DEBUG   SenderThread:191 [sender.py:send():379] send: metric
+2024-04-11 03:59:26,729 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: stop_status
+2024-04-11 03:59:26,730 DEBUG   SenderThread:191 [sender.py:send():379] send: telemetry
+2024-04-11 03:59:26,731 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: stop_status
+2024-04-11 03:59:26,776 DEBUG   SenderThread:191 [sender.py:send():379] send: metric
+2024-04-11 03:59:26,776 WARNING SenderThread:191 [sender.py:send_metric():1341] Seen metric with glob (shouldn't happen)
+2024-04-11 03:59:26,776 DEBUG   SenderThread:191 [sender.py:send():379] send: telemetry
+2024-04-11 03:59:27,522 INFO    Thread-12 :191 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/requirements.txt
+2024-04-11 03:59:27,523 INFO    Thread-12 :191 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
+2024-04-11 03:59:29,523 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
+2024-04-11 03:59:30,951 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:31,524 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
+2024-04-11 03:59:33,525 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
+2024-04-11 03:59:35,952 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:40,958 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:41,528 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/config.yaml
+2024-04-11 03:59:41,717 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: internal_messages
+2024-04-11 03:59:41,717 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: stop_status
+2024-04-11 03:59:41,718 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: stop_status
+2024-04-11 03:59:45,530 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
+2024-04-11 03:59:46,261 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:51,262 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:56,417 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:56,717 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: stop_status
+2024-04-11 03:59:56,718 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: internal_messages
+2024-04-11 03:59:56,719 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: stop_status
+2024-04-11 03:59:57,534 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
+2024-04-11 04:00:01,827 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 04:00:06,828 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 04:00:08,943 DEBUG   SenderThread:191 [sender.py:send():379] send: telemetry
+2024-04-11 04:00:08,983 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: partial_history
+2024-04-11 04:00:08,985 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: summary_record
+2024-04-11 04:00:08,988 INFO    SenderThread:191 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
+2024-04-11 04:00:08,988 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: summary_record
+2024-04-11 04:00:08,989 INFO    SenderThread:191 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
+2024-04-11 04:00:08,989 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: summary_record
+2024-04-11 04:00:08,989 INFO    SenderThread:191 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
+2024-04-11 04:00:08,989 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: summary_record
+2024-04-11 04:00:08,990 INFO    SenderThread:191 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
+2024-04-11 04:00:08,990 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: summary_record
+2024-04-11 04:00:08,990 INFO    SenderThread:191 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
+2024-04-11 04:00:08,990 DEBUG   SenderThread:191 [sender.py:send():379] send: metric
+2024-04-11 04:00:08,991 DEBUG   SenderThread:191 [sender.py:send():379] send: history
+2024-04-11 04:00:08,991 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: summary_record
+2024-04-11 04:00:08,991 INFO    SenderThread:191 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
+2024-04-11 04:00:09,539 INFO    Thread-12 :191 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/wandb-summary.json
+2024-04-11 04:00:10,645 DEBUG   SystemMonitor:191 [system_monitor.py:_start():172] Starting system metrics aggregation loop
+2024-04-11 04:00:10,647 DEBUG   SenderThread:191 [sender.py:send():379] send: stats
+2024-04-11 04:00:11,539 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
+2024-04-11 04:00:11,715 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: stop_status
+2024-04-11 04:00:11,716 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: stop_status
+2024-04-11 04:00:11,719 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: internal_messages
+2024-04-11 04:00:11,833 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 04:00:12,540 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/config.yaml
+2024-04-11 04:00:16,925 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 04:00:21,926 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 04:00:26,716 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: stop_status
+2024-04-11 04:00:26,716 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: stop_status
+2024-04-11 04:00:26,757 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: internal_messages
+2024-04-11 04:00:27,786 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 04:00:32,787 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 04:00:37,788 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report

wandb/debug.log CHANGED Viewed

@@ -1,32 +1,32 @@
-2024-04-11 01:01:03,977 INFO    MainThread:94 [wandb_setup.py:_flush():76] Current SDK version is 0.16.5
-2024-04-11 01:01:03,978 INFO    MainThread:94 [wandb_setup.py:_flush():76] Configure stats pid to 94
-2024-04-11 01:01:03,978 INFO    MainThread:94 [wandb_setup.py:_flush():76] Loading settings from /root/.config/wandb/settings
-2024-04-11 01:01:03,978 INFO    MainThread:94 [wandb_setup.py:_flush():76] Loading settings from /kaggle/working/wandb/settings
-2024-04-11 01:01:03,978 INFO    MainThread:94 [wandb_setup.py:_flush():76] Loading settings from environment variables: {}
-2024-04-11 01:01:03,978 INFO    MainThread:94 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
-2024-04-11 01:01:03,978 INFO    MainThread:94 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program': '<python with no main file>'}
-2024-04-11 01:01:03,978 INFO    MainThread:94 [wandb_setup.py:_flush():76] Applying login settings: {}
-2024-04-11 01:01:03,978 INFO    MainThread:94 [wandb_setup.py:_flush():76] Applying login settings: {'api_key': '***REDACTED***'}
-2024-04-11 01:01:03,978 INFO    MainThread:94 [wandb_init.py:_log_setup():527] Logging user logs to /kaggle/working/wandb/run-20240411_010103-4b3fzolv/logs/debug.log
-2024-04-11 01:01:03,978 INFO    MainThread:94 [wandb_init.py:_log_setup():528] Logging internal logs to /kaggle/working/wandb/run-20240411_010103-4b3fzolv/logs/debug-internal.log
-2024-04-11 01:01:03,978 INFO    MainThread:94 [wandb_init.py:_jupyter_setup():473] configuring jupyter hooks <wandb.sdk.wandb_init._WandbInit object at 0x7bfd48105450>
-2024-04-11 01:01:03,978 INFO    MainThread:94 [wandb_init.py:init():567] calling init triggers
-2024-04-11 01:01:03,979 INFO    MainThread:94 [wandb_init.py:init():574] wandb.init called with sweep_config: {}
 config: {}
-2024-04-11 01:01:03,979 INFO    MainThread:94 [wandb_init.py:init():617] starting backend
-2024-04-11 01:01:03,979 INFO    MainThread:94 [wandb_init.py:init():621] setting up manager
-2024-04-11 01:01:03,980 INFO    MainThread:94 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
-2024-04-11 01:01:03,984 INFO    MainThread:94 [wandb_init.py:init():629] backend started and connected
-2024-04-11 01:01:03,997 INFO    MainThread:94 [wandb_run.py:_label_probe_notebook():1299] probe notebook
-2024-04-11 01:01:04,350 INFO    MainThread:94 [wandb_init.py:init():721] updated telemetry
-2024-04-11 01:01:04,354 INFO    MainThread:94 [wandb_init.py:init():754] communicating run to backend with 90.0 second timeout
-2024-04-11 01:01:04,510 INFO    MainThread:94 [wandb_run.py:_on_init():2344] communicating current version
-2024-04-11 01:01:04,593 INFO    MainThread:94 [wandb_run.py:_on_init():2353] got version response upgrade_message: "wandb version 0.16.6 is available!  To upgrade, please run:\n $ pip install wandb --upgrade"
-2024-04-11 01:01:04,593 INFO    MainThread:94 [wandb_init.py:init():805] starting run threads in backend
-2024-04-11 01:01:20,600 INFO    MainThread:94 [wandb_run.py:_console_start():2323] atexit reg
-2024-04-11 01:01:20,600 INFO    MainThread:94 [wandb_run.py:_redirect():2178] redirect: wrap_raw
-2024-04-11 01:01:20,601 INFO    MainThread:94 [wandb_run.py:_redirect():2243] Wrapping output streams.
-2024-04-11 01:01:20,601 INFO    MainThread:94 [wandb_run.py:_redirect():2268] Redirects installed.
-2024-04-11 01:01:20,602 INFO    MainThread:94 [wandb_init.py:init():848] run started, returning control to user process
-2024-04-11 01:01:20,608 INFO    MainThread:94 [wandb_run.py:_config_callback():1347] config_cb None None {'vocab_size': 50257, 'n_positions': 1024, 'n_embd': 1280, 'n_layer': 36, 'n_head': 20, 'n_inner': None, 'activation_function': 'gelu_new', 'resid_pdrop': 0.1, 'embd_pdrop': 0.1, 'attn_pdrop': 0.1, 'layer_norm_epsilon': 1e-05, 'initializer_range': 0.02, 'summary_type': 'cls_index', 'summary_use_proj': True, 'summary_activation': None, 'summary_first_dropout': 0.1, 'summary_proj_to_labels': True, 'scale_attn_weights': True, 'use_cache': False, 'scale_attn_by_inverse_layer_idx': False, 'reorder_and_upcast_attn': False, 'bos_token_id': 50256, 'eos_token_id': 50256, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': None, 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['GPT2LMHeadModel'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'pad_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': {'text-generation': 
{'do_sample': True, 'max_length': 50}}, 'problem_type': None, '_name_or_path': 'openai-community/gpt2-large', 'transformers_version': '4.39.3', 'model_type': 'gpt2', 'n_ctx': 1024, 'quantization_config': {'quant_method': 'QuantizationMethod.BITS_AND_BYTES', '_load_in_8bit': False, '_load_in_4bit': True, 'llm_int8_threshold': 6.0, 'llm_int8_skip_modules': None, 'llm_int8_enable_fp32_cpu_offload': False, 'llm_int8_has_fp16_weight': False, 'bnb_4bit_quant_type': 'nf4', 'bnb_4bit_use_double_quant': False, 'bnb_4bit_compute_dtype': 'float16', 'bnb_4bit_quant_storage': 'uint8', 'load_in_4bit': True, 'load_in_8bit': False}, 'output_dir': '/kaggle/working/', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': False, 'do_predict': False, 'evaluation_strategy': 'no', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'learning_rate': 3e-05, 'weight_decay': 0.0001, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 0.3, 'num_train_epochs': 5, 'max_steps': 20, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/kaggle/working/runs/Apr11_00-59-48_c072b7c9e487', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 20, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 1, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 
'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': None, 'dataloader_num_workers': 8, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': '/kaggle/working/', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'paged_adamw_8bit', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['tensorboard', 'wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': True, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': True, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 
'neftune_noise_alpha': None, 'optim_target_modules': None}

+2024-04-11 03:59:09,934 INFO    MainThread:145 [wandb_setup.py:_flush():76] Current SDK version is 0.16.5
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Configure stats pid to 145
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Loading settings from /root/.config/wandb/settings
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Loading settings from /kaggle/working/wandb/settings
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Loading settings from environment variables: {}
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program': '<python with no main file>'}
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Applying login settings: {}
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Applying login settings: {'api_key': '***REDACTED***'}
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_init.py:_log_setup():527] Logging user logs to /kaggle/working/wandb/run-20240411_035909-21esl9hl/logs/debug.log
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_init.py:_log_setup():528] Logging internal logs to /kaggle/working/wandb/run-20240411_035909-21esl9hl/logs/debug-internal.log
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_init.py:_jupyter_setup():473] configuring jupyter hooks <wandb.sdk.wandb_init._WandbInit object at 0x7e1d3f588970>
+2024-04-11 03:59:09,936 INFO    MainThread:145 [wandb_init.py:init():567] calling init triggers
+2024-04-11 03:59:09,936 INFO    MainThread:145 [wandb_init.py:init():574] wandb.init called with sweep_config: {}
 config: {}
+2024-04-11 03:59:09,936 INFO    MainThread:145 [wandb_init.py:init():617] starting backend
+2024-04-11 03:59:09,936 INFO    MainThread:145 [wandb_init.py:init():621] setting up manager
+2024-04-11 03:59:09,938 INFO    MainThread:145 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
+2024-04-11 03:59:09,940 INFO    MainThread:145 [wandb_init.py:init():629] backend started and connected
+2024-04-11 03:59:09,953 INFO    MainThread:145 [wandb_run.py:_label_probe_notebook():1299] probe notebook
+2024-04-11 03:59:10,362 INFO    MainThread:145 [wandb_init.py:init():721] updated telemetry
+2024-04-11 03:59:10,366 INFO    MainThread:145 [wandb_init.py:init():754] communicating run to backend with 90.0 second timeout
+2024-04-11 03:59:10,526 INFO    MainThread:145 [wandb_run.py:_on_init():2344] communicating current version
+2024-04-11 03:59:10,613 INFO    MainThread:145 [wandb_run.py:_on_init():2353] got version response upgrade_message: "wandb version 0.16.6 is available!  To upgrade, please run:\n $ pip install wandb --upgrade"
+2024-04-11 03:59:10,614 INFO    MainThread:145 [wandb_init.py:init():805] starting run threads in backend
+2024-04-11 03:59:26,715 INFO    MainThread:145 [wandb_run.py:_console_start():2323] atexit reg
+2024-04-11 03:59:26,715 INFO    MainThread:145 [wandb_run.py:_redirect():2178] redirect: wrap_raw
+2024-04-11 03:59:26,716 INFO    MainThread:145 [wandb_run.py:_redirect():2243] Wrapping output streams.
+2024-04-11 03:59:26,716 INFO    MainThread:145 [wandb_run.py:_redirect():2268] Redirects installed.
+2024-04-11 03:59:26,717 INFO    MainThread:145 [wandb_init.py:init():848] run started, returning control to user process
+2024-04-11 03:59:26,723 INFO    MainThread:145 [wandb_run.py:_config_callback():1347] config_cb None None {'vocab_size': 250880, 'hidden_size': 1024, 'n_layer': 24, 'n_head': 16, 'layer_norm_epsilon': 1e-05, 'initializer_range': 0.02, 'use_cache': False, 'pretraining_tp': 1, 'apply_residual_connection_post_layernorm': False, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'bos_token_id': 1, 'eos_token_id': 2, 'slow_but_exact': False, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': None, 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['BloomForCausalLM'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'pad_token_id': 3, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'bigscience/bloomz-560m', 'transformers_version': '4.39.3', 'attention_softmax_in_fp32': True, 'bias_dropout_fusion': True, 'unk_token_id': 0, 'masked_softmax_fusion': True, 'model_type': 'bloom', 'n_inner': None, 
'offset_alibi': 100, 'seq_length': 2048, 'skip_bias_add': True, 'skip_bias_add_qkv': False, 'quantization_config': {'quant_method': 'QuantizationMethod.BITS_AND_BYTES', '_load_in_8bit': False, '_load_in_4bit': True, 'llm_int8_threshold': 6.0, 'llm_int8_skip_modules': None, 'llm_int8_enable_fp32_cpu_offload': False, 'llm_int8_has_fp16_weight': False, 'bnb_4bit_quant_type': 'nf4', 'bnb_4bit_use_double_quant': False, 'bnb_4bit_compute_dtype': 'float16', 'bnb_4bit_quant_storage': 'uint8', 'load_in_4bit': True, 'load_in_8bit': False}, 'output_dir': '/kaggle/working/', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': False, 'do_predict': False, 'evaluation_strategy': 'no', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'learning_rate': 3e-05, 'weight_decay': 0.0001, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 0.3, 'num_train_epochs': 5, 'max_steps': 10, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/kaggle/working/runs/Apr11_03-48-59_321ddc84c049', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 20, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 1, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 
'debug': [], 'dataloader_drop_last': False, 'eval_steps': None, 'dataloader_num_workers': 8, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': '/kaggle/working/', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'paged_adamw_32bit', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['tensorboard', 'wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': True, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': True, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None}

wandb/run-20240411_035909-21esl9hl/files/conda-environment.yaml ADDED Viewed

File without changes

wandb/run-20240411_035909-21esl9hl/files/config.yaml ADDED Viewed

	@@ -0,0 +1,690 @@

+wandb_version: 1
+_wandb:
+  desc: null
+  value:
+    python_version: 3.10.13
+    cli_version: 0.16.5
+    framework: huggingface
+    huggingface_version: 4.39.3
+    is_jupyter_run: true
+    is_kaggle_kernel: true
+    start_time: 1712807949.0
+    t:
+      1:
+      - 1
+      - 2
+      - 3
+      - 5
+      - 11
+      - 12
+      - 49
+      - 51
+      - 53
+      - 55
+      - 71
+      - 84
+      - 98
+      - 105
+      2:
+      - 1
+      - 2
+      - 3
+      - 5
+      - 11
+      - 12
+      - 49
+      - 51
+      - 53
+      - 55
+      - 71
+      - 84
+      - 98
+      - 105
+      3:
+      - 7
+      - 23
+      - 62
+      4: 3.10.13
+      5: 0.16.5
+      6: 4.39.3
+      8:
+      - 1
+      - 2
+      - 5
+      9:
+        1: transformers_trainer
+      13: linux-x86_64
+    m:
+    - 1: train/global_step
+      6:
+      - 3
+    - 1: train/epoch
+      5: 1
+      6:
+      - 1
+vocab_size:
+  desc: null
+  value: 250880
+hidden_size:
+  desc: null
+  value: 1024
+n_layer:
+  desc: null
+  value: 24
+n_head:
+  desc: null
+  value: 16
+layer_norm_epsilon:
+  desc: null
+  value: 1.0e-05
+initializer_range:
+  desc: null
+  value: 0.02
+use_cache:
+  desc: null
+  value: false
+pretraining_tp:
+  desc: null
+  value: 1
+apply_residual_connection_post_layernorm:
+  desc: null
+  value: false
+hidden_dropout:
+  desc: null
+  value: 0.0
+attention_dropout:
+  desc: null
+  value: 0.0
+bos_token_id:
+  desc: null
+  value: 1
+eos_token_id:
+  desc: null
+  value: 2
+slow_but_exact:
+  desc: null
+  value: false
+return_dict:
+  desc: null
+  value: true
+output_hidden_states:
+  desc: null
+  value: false
+output_attentions:
+  desc: null
+  value: false
+torchscript:
+  desc: null
+  value: false
+torch_dtype:
+  desc: null
+  value: null
+use_bfloat16:
+  desc: null
+  value: false
+tf_legacy_loss:
+  desc: null
+  value: false
+pruned_heads:
+  desc: null
+  value: {}
+tie_word_embeddings:
+  desc: null
+  value: true
+chunk_size_feed_forward:
+  desc: null
+  value: 0
+is_encoder_decoder:
+  desc: null
+  value: false
+is_decoder:
+  desc: null
+  value: false
+cross_attention_hidden_size:
+  desc: null
+  value: null
+add_cross_attention:
+  desc: null
+  value: false
+tie_encoder_decoder:
+  desc: null
+  value: false
+max_length:
+  desc: null
+  value: 20
+min_length:
+  desc: null
+  value: 0
+do_sample:
+  desc: null
+  value: false
+early_stopping:
+  desc: null
+  value: false
+num_beams:
+  desc: null
+  value: 1
+num_beam_groups:
+  desc: null
+  value: 1
+diversity_penalty:
+  desc: null
+  value: 0.0
+temperature:
+  desc: null
+  value: 1.0
+top_k:
+  desc: null
+  value: 50
+top_p:
+  desc: null
+  value: 1.0
+typical_p:
+  desc: null
+  value: 1.0
+repetition_penalty:
+  desc: null
+  value: 1.0
+length_penalty:
+  desc: null
+  value: 1.0
+no_repeat_ngram_size:
+  desc: null
+  value: 0
+encoder_no_repeat_ngram_size:
+  desc: null
+  value: 0
+bad_words_ids:
+  desc: null
+  value: null
+num_return_sequences:
+  desc: null
+  value: 1
+output_scores:
+  desc: null
+  value: false
+return_dict_in_generate:
+  desc: null
+  value: false
+forced_bos_token_id:
+  desc: null
+  value: null
+forced_eos_token_id:
+  desc: null
+  value: null
+remove_invalid_values:
+  desc: null
+  value: false
+exponential_decay_length_penalty:
+  desc: null
+  value: null
+suppress_tokens:
+  desc: null
+  value: null
+begin_suppress_tokens:
+  desc: null
+  value: null
+architectures:
+  desc: null
+  value:
+  - BloomForCausalLM
+finetuning_task:
+  desc: null
+  value: null
+id2label:
+  desc: null
+  value:
+    '0': LABEL_0
+    '1': LABEL_1
+label2id:
+  desc: null
+  value:
+    LABEL_0: 0
+    LABEL_1: 1
+tokenizer_class:
+  desc: null
+  value: null
+prefix:
+  desc: null
+  value: null
+pad_token_id:
+  desc: null
+  value: 3
+sep_token_id:
+  desc: null
+  value: null
+decoder_start_token_id:
+  desc: null
+  value: null
+task_specific_params:
+  desc: null
+  value: null
+problem_type:
+  desc: null
+  value: null
+_name_or_path:
+  desc: null
+  value: bigscience/bloomz-560m
+transformers_version:
+  desc: null
+  value: 4.39.3
+attention_softmax_in_fp32:
+  desc: null
+  value: true
+bias_dropout_fusion:
+  desc: null
+  value: true
+unk_token_id:
+  desc: null
+  value: 0
+masked_softmax_fusion:
+  desc: null
+  value: true
+model_type:
+  desc: null
+  value: bloom
+n_inner:
+  desc: null
+  value: null
+offset_alibi:
+  desc: null
+  value: 100
+seq_length:
+  desc: null
+  value: 2048
+skip_bias_add:
+  desc: null
+  value: true
+skip_bias_add_qkv:
+  desc: null
+  value: false
+quantization_config:
+  desc: null
+  value:
+    quant_method: QuantizationMethod.BITS_AND_BYTES
+    _load_in_8bit: false
+    _load_in_4bit: true
+    llm_int8_threshold: 6.0
+    llm_int8_skip_modules: null
+    llm_int8_enable_fp32_cpu_offload: false
+    llm_int8_has_fp16_weight: false
+    bnb_4bit_quant_type: nf4
+    bnb_4bit_use_double_quant: false
+    bnb_4bit_compute_dtype: float16
+    bnb_4bit_quant_storage: uint8
+    load_in_4bit: true
+    load_in_8bit: false
+output_dir:
+  desc: null
+  value: /kaggle/working/
+overwrite_output_dir:
+  desc: null
+  value: false
+do_train:
+  desc: null
+  value: false
+do_eval:
+  desc: null
+  value: false
+do_predict:
+  desc: null
+  value: false
+evaluation_strategy:
+  desc: null
+  value: 'no'
+prediction_loss_only:
+  desc: null
+  value: false
+per_device_train_batch_size:
+  desc: null
+  value: 8
+per_device_eval_batch_size:
+  desc: null
+  value: 8
+per_gpu_train_batch_size:
+  desc: null
+  value: null
+per_gpu_eval_batch_size:
+  desc: null
+  value: null
+gradient_accumulation_steps:
+  desc: null
+  value: 1
+eval_accumulation_steps:
+  desc: null
+  value: null
+eval_delay:
+  desc: null
+  value: 0
+learning_rate:
+  desc: null
+  value: 3.0e-05
+weight_decay:
+  desc: null
+  value: 0.0001
+adam_beta1:
+  desc: null
+  value: 0.9
+adam_beta2:
+  desc: null
+  value: 0.999
+adam_epsilon:
+  desc: null
+  value: 1.0e-08
+max_grad_norm:
+  desc: null
+  value: 0.3
+num_train_epochs:
+  desc: null
+  value: 5
+max_steps:
+  desc: null
+  value: 10
+lr_scheduler_type:
+  desc: null
+  value: cosine
+lr_scheduler_kwargs:
+  desc: null
+  value: {}
+warmup_ratio:
+  desc: null
+  value: 0.03
+warmup_steps:
+  desc: null
+  value: 0
+log_level:
+  desc: null
+  value: passive
+log_level_replica:
+  desc: null
+  value: warning
+log_on_each_node:
+  desc: null
+  value: true
+logging_dir:
+  desc: null
+  value: /kaggle/working/runs/Apr11_03-48-59_321ddc84c049
+logging_strategy:
+  desc: null
+  value: steps
+logging_first_step:
+  desc: null
+  value: false
+logging_steps:
+  desc: null
+  value: 20
+logging_nan_inf_filter:
+  desc: null
+  value: true
+save_strategy:
+  desc: null
+  value: steps
+save_steps:
+  desc: null
+  value: 20
+save_total_limit:
+  desc: null
+  value: 1
+save_safetensors:
+  desc: null
+  value: true
+save_on_each_node:
+  desc: null
+  value: false
+save_only_model:
+  desc: null
+  value: false
+no_cuda:
+  desc: null
+  value: false
+use_cpu:
+  desc: null
+  value: false
+use_mps_device:
+  desc: null
+  value: false
+seed:
+  desc: null
+  value: 42
+data_seed:
+  desc: null
+  value: null
+jit_mode_eval:
+  desc: null
+  value: false
+use_ipex:
+  desc: null
+  value: false
+bf16:
+  desc: null
+  value: false
+fp16:
+  desc: null
+  value: false
+fp16_opt_level:
+  desc: null
+  value: O1
+half_precision_backend:
+  desc: null
+  value: auto
+bf16_full_eval:
+  desc: null
+  value: false
+fp16_full_eval:
+  desc: null
+  value: false
+tf32:
+  desc: null
+  value: null
+local_rank:
+  desc: null
+  value: 0
+ddp_backend:
+  desc: null
+  value: null
+tpu_num_cores:
+  desc: null
+  value: null
+tpu_metrics_debug:
+  desc: null
+  value: false
+debug:
+  desc: null
+  value: []
+dataloader_drop_last:
+  desc: null
+  value: false
+eval_steps:
+  desc: null
+  value: null
+dataloader_num_workers:
+  desc: null
+  value: 8
+dataloader_prefetch_factor:
+  desc: null
+  value: null
+past_index:
+  desc: null
+  value: -1
+run_name:
+  desc: null
+  value: /kaggle/working/
+disable_tqdm:
+  desc: null
+  value: false
+remove_unused_columns:
+  desc: null
+  value: true
+label_names:
+  desc: null
+  value: null
+load_best_model_at_end:
+  desc: null
+  value: false
+metric_for_best_model:
+  desc: null
+  value: null
+greater_is_better:
+  desc: null
+  value: null
+ignore_data_skip:
+  desc: null
+  value: false
+fsdp:
+  desc: null
+  value: []
+fsdp_min_num_params:
+  desc: null
+  value: 0
+fsdp_config:
+  desc: null
+  value:
+    min_num_params: 0
+    xla: false
+    xla_fsdp_v2: false
+    xla_fsdp_grad_ckpt: false
+fsdp_transformer_layer_cls_to_wrap:
+  desc: null
+  value: null
+accelerator_config:
+  desc: null
+  value:
+    split_batches: false
+    dispatch_batches: null
+    even_batches: true
+    use_seedable_sampler: true
+deepspeed:
+  desc: null
+  value: null
+label_smoothing_factor:
+  desc: null
+  value: 0.0
+optim:
+  desc: null
+  value: paged_adamw_32bit
+optim_args:
+  desc: null
+  value: null
+adafactor:
+  desc: null
+  value: false
+group_by_length:
+  desc: null
+  value: false
+length_column_name:
+  desc: null
+  value: length
+report_to:
+  desc: null
+  value:
+  - tensorboard
+  - wandb
+ddp_find_unused_parameters:
+  desc: null
+  value: null
+ddp_bucket_cap_mb:
+  desc: null
+  value: null
+ddp_broadcast_buffers:
+  desc: null
+  value: null
+dataloader_pin_memory:
+  desc: null
+  value: true
+dataloader_persistent_workers:
+  desc: null
+  value: false
+skip_memory_metrics:
+  desc: null
+  value: true
+use_legacy_prediction_loop:
+  desc: null
+  value: false
+push_to_hub:
+  desc: null
+  value: false
+resume_from_checkpoint:
+  desc: null
+  value: null
+hub_model_id:
+  desc: null
+  value: null
+hub_strategy:
+  desc: null
+  value: every_save
+hub_token:
+  desc: null
+  value: <HUB_TOKEN>
+hub_private_repo:
+  desc: null
+  value: false
+hub_always_push:
+  desc: null
+  value: false
+gradient_checkpointing:
+  desc: null
+  value: true
+gradient_checkpointing_kwargs:
+  desc: null
+  value: null
+include_inputs_for_metrics:
+  desc: null
+  value: false
+fp16_backend:
+  desc: null
+  value: auto
+push_to_hub_model_id:
+  desc: null
+  value: null
+push_to_hub_organization:
+  desc: null
+  value: null
+push_to_hub_token:
+  desc: null
+  value: <PUSH_TO_HUB_TOKEN>
+mp_parameters:
+  desc: null
+  value: ''
+auto_find_batch_size:
+  desc: null
+  value: true
+full_determinism:
+  desc: null
+  value: false
+torchdynamo:
+  desc: null
+  value: null
+ray_scope:
+  desc: null
+  value: last
+ddp_timeout:
+  desc: null
+  value: 1800
+torch_compile:
+  desc: null
+  value: false
+torch_compile_backend:
+  desc: null
+  value: null
+torch_compile_mode:
+  desc: null
+  value: null
+dispatch_batches:
+  desc: null
+  value: null
+split_batches:
+  desc: null
+  value: null
+include_tokens_per_second:
+  desc: null
+  value: false
+include_num_input_tokens_seen:
+  desc: null
+  value: false
+neftune_noise_alpha:
+  desc: null
+  value: null
+optim_target_modules:
+  desc: null
+  value: null

wandb/run-20240411_035909-21esl9hl/files/output.log ADDED Viewed

	@@ -0,0 +1,103 @@

+/opt/conda/lib/python3.10/site-packages/torch/utils/data/dataloader.py:557: UserWarning: This DataLoader will create 8 worker processes in total. Our suggested max number of worker in current system is 4, which is smaller than what this DataLoader is going to create. Please be aware that excessive worker creation might get DataLoader running slow or even freeze, lower the worker number to avoid potential slowness/freeze if necessary.
+  warnings.warn(_create_warning_msg(
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+/opt/conda/lib/python3.10/site-packages/torch/utils/checkpoint.py:429: UserWarning: torch.utils.checkpoint: please pass in use_reentrant=True or use_reentrant=False explicitly. The default value of use_reentrant will be updated to be False in the future. To maintain current behavior, pass use_reentrant=True. It is recommended that you use use_reentrant=False. Refer to docs for more details on the differences between the two variants.
+  warnings.warn(
+/opt/conda/lib/python3.10/site-packages/torch/nn/parallel/_functions.py:68: UserWarning: Was asked to gather along dimension 0, but all input tensors were scalars; will instead unsqueeze and return a vector.
+  warnings.warn('Was asked to gather along dimension 0, but all '
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
+To disable this warning, you can either:
+	- Avoid using `tokenizers` before the fork if possible
+	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
+/opt/conda/lib/python3.10/site-packages/peft/utils/save_and_load.py:139: UserWarning: Setting `save_embedding_layers` to `True` as embedding layers found in `target_modules`.

wandb/run-20240411_035909-21esl9hl/files/requirements.txt ADDED Viewed

	@@ -0,0 +1,864 @@

+Babel==2.14.0
+Boruta==0.3
+Brotli==1.0.9
+CVXcanon==0.1.2
+Cartopy==0.22.0
+Cython==3.0.8
+Deprecated==1.2.14
+Farama-Notifications==0.0.4
+Flask==3.0.2
+Geohash==1.0
+GitPython==3.1.41
+ImageHash==4.3.1
+Janome==0.5.0
+Jinja2==3.1.2
+LunarCalendar==0.0.9
+Mako==1.3.2
+Markdown==3.5.2
+MarkupSafe==2.1.3
+MarkupSafe==2.1.5
+Pillow==9.5.0
+PuLP==2.8.0
+PyArabic==0.6.15
+PyJWT==2.8.0
+PyMeeus==0.5.12
+PySocks==1.7.1
+PyUpSet==0.1.1.post7
+PyWavelets==1.5.0
+PyYAML==6.0.1
+Pygments==2.17.2
+Pympler==1.0.1
+QtPy==2.4.1
+Rtree==1.2.0
+SQLAlchemy==2.0.25
+SecretStorage==3.3.3
+Send2Trash==1.8.2
+Shapely==1.8.5.post1
+Shimmy==1.3.0
+SimpleITK==2.3.1
+TPOT==0.12.1
+Theano-PyMC==1.1.2
+Theano==1.0.5
+Wand==0.6.13
+Werkzeug==3.0.2
+absl-py==1.4.0
+accelerate==0.28.0
+access==1.1.9
+affine==2.4.0
+aiobotocore==2.12.2
+aiofiles==22.1.0
+aiohttp-cors==0.7.0
+aiohttp==3.9.1
+aioitertools==0.11.0
+aiorwlock==1.3.0
+aiosignal==1.3.1
+aiosqlite==0.19.0
+albumentations==1.4.0
+alembic==1.13.1
+altair==5.3.0
+annotated-types==0.6.0
+annoy==1.17.3
+anyio==4.2.0
+apache-beam==2.46.0
+aplus==0.11.0
+appdirs==1.4.4
+archspec==0.2.3
+argon2-cffi-bindings==21.2.0
+argon2-cffi==23.1.0
+array-record==0.5.0
+arrow==1.3.0
+arviz==0.17.1
+astroid==3.1.0
+astropy-iers-data==0.2024.4.1.0.33.14
+astropy==6.0.1
+asttokens==2.4.1
+astunparse==1.6.3
+async-lru==2.0.4
+async-timeout==4.0.3
+attrs==23.2.0
+audioread==3.0.1
+autopep8==2.0.4
+backoff==2.2.1
+bayesian-optimization==1.4.3
+beatrix_jupyterlab==2023.128.151533
+beautifulsoup4==4.12.2
+bitsandbytes==0.43.0
+blake3==0.2.1
+bleach==6.1.0
+blessed==1.20.0
+blinker==1.7.0
+blis==0.7.10
+blosc2==2.6.0
+bokeh==3.3.4
+boltons==23.1.1
+boto3==1.26.100
+botocore==1.34.51
+bq_helper==0.4.1
+bqplot==0.12.43
+branca==0.7.1
+brewer2mpl==1.4.1
+brotlipy==0.7.0
+cached-property==1.5.2
+cachetools==4.2.4
+cachetools==5.3.2
+catalogue==2.0.10
+catalyst==22.4
+catboost==1.2.3
+category-encoders==2.6.3
+certifi==2024.2.2
+cesium==0.12.1
+cffi==1.16.0
+charset-normalizer==3.3.2
+chex==0.1.86
+cleverhans==4.0.0
+click-plugins==1.1.1
+click==8.1.7
+cligj==0.7.2
+cloud-tpu-client==0.10
+cloud-tpu-profiler==2.4.0
+cloudpathlib==0.16.0
+cloudpickle==2.2.1
+cloudpickle==3.0.0
+cmdstanpy==1.2.2
+colorama==0.4.6
+colorcet==3.1.0
+colorful==0.5.6
+colorlog==6.8.2
+colorlover==0.3.0
+comm==0.2.1
+conda-libmamba-solver==23.7.0
+conda-package-handling==2.2.0
+conda==23.7.4
+conda_package_streaming==0.9.0
+confection==0.1.4
+contextily==1.6.0
+contourpy==1.2.0
+convertdate==2.4.0
+crcmod==1.7
+cryptography==41.0.7
+cuda-python==12.4.0
+cudf==23.8.0
+cufflinks==0.17.3
+cuml==23.8.0
+cupy==13.0.0
+cycler==0.12.1
+cymem==2.0.8
+cytoolz==0.12.3
+daal4py==2024.2.0
+daal==2024.2.0
+dacite==1.8.1
+dask-cuda==23.8.0
+dask-cudf==23.8.0
+dask-expr==1.0.9
+dask==2024.4.0
+dataclasses-json==0.6.4
+dataproc_jupyter_plugin==0.1.66
+datasets==2.16.0
+datashader==0.16.0
+datatile==1.0.3
+db-dtypes==1.2.0
+deap==1.4.1
+debugpy==1.8.0
+decorator==5.1.1
+deepdiff==6.7.1
+defusedxml==0.7.1
+deprecation==2.1.0
+descartes==1.1.0
+dill==0.3.7
+dipy==1.9.0
+distlib==0.3.8
+distributed==2023.7.1
+distro==1.9.0
+dm-tree==0.1.8
+docker-pycreds==0.4.0
+docker==7.0.0
+docopt==0.6.2
+docstring-parser==0.15
+docstring-to-markdown==0.15
+docutils==0.20.1
+earthengine-api==0.1.395
+easydict==1.13
+easyocr==1.7.1
+ecos==2.0.13
+eli5==0.13.0
+emoji==2.11.0
+en-core-web-lg==3.7.1
+en-core-web-sm==3.7.1
+entrypoints==0.4
+ephem==4.1.5
+esda==2.5.1
+essentia==2.1b6.dev1110
+et-xmlfile==1.1.0
+etils==1.6.0
+exceptiongroup==1.2.0
+executing==2.0.1
+explainable-ai-sdk==1.3.3
+fastai==2.7.14
+fastapi==0.108.0
+fastavro==1.9.3
+fastcore==1.5.29
+fastdownload==0.0.7
+fasteners==0.19
+fastjsonschema==2.19.1
+fastprogress==1.0.3
+fastrlock==0.8.2
+fasttext==0.9.2
+feather-format==0.4.1
+featuretools==1.30.0
+filelock==3.13.1
+fiona==1.9.6
+fitter==1.7.0
+flake8==7.0.0
+flashtext==2.7
+flatbuffers==23.5.26
+flax==0.8.2
+folium==0.16.0
+fonttools==4.47.0
+fonttools==4.50.0
+fqdn==1.5.1
+frozendict==2.4.1
+frozenlist==1.4.1
+fsspec==2023.10.0
+fsspec==2024.3.1
+funcy==2.0
+fury==0.10.0
+future==1.0.0
+fuzzywuzzy==0.18.0
+gast==0.5.4
+gatspy==0.3
+gcsfs==2024.2.0
+gensim==4.3.2
+geographiclib==2.0
+geojson==3.1.0
+geopandas==0.14.3
+geoplot==0.5.1
+geopy==2.4.1
+geoviews==1.11.1
+ggplot==0.11.5
+giddy==2.3.5
+gitdb==4.0.11
+google-ai-generativelanguage==0.4.0
+google-api-core==2.11.1
+google-api-core==2.18.0
+google-api-python-client==2.125.0
+google-apitools==0.5.31
+google-auth-httplib2==0.2.0
+google-auth-oauthlib==1.2.0
+google-auth==2.26.1
+google-cloud-aiplatform==0.6.0a1
+google-cloud-artifact-registry==1.10.0
+google-cloud-automl==1.0.1
+google-cloud-bigquery==2.34.4
+google-cloud-bigtable==1.7.3
+google-cloud-core==2.4.1
+google-cloud-datastore==2.19.0
+google-cloud-dlp==3.14.0
+google-cloud-jupyter-config==0.0.5
+google-cloud-language==2.13.3
+google-cloud-monitoring==2.18.0
+google-cloud-pubsub==2.19.0
+google-cloud-pubsublite==1.9.0
+google-cloud-recommendations-ai==0.7.1
+google-cloud-resource-manager==1.11.0
+google-cloud-spanner==3.40.1
+google-cloud-storage==1.44.0
+google-cloud-translate==3.12.1
+google-cloud-videointelligence==2.13.3
+google-cloud-vision==2.8.0
+google-crc32c==1.5.0
+google-generativeai==0.4.1
+google-pasta==0.2.0
+google-resumable-media==2.7.0
+googleapis-common-protos==1.62.0
+gplearn==0.4.2
+gpustat==1.0.0
+gpxpy==1.6.2
+graphviz==0.20.3
+greenlet==3.0.3
+grpc-google-iam-v1==0.12.7
+grpcio-status==1.48.1
+grpcio-status==1.48.2
+grpcio==1.51.1
+grpcio==1.60.0
+gviz-api==1.10.0
+gym-notices==0.0.8
+gym==0.26.2
+gymnasium==0.29.0
+h11==0.14.0
+h2o==3.46.0.1
+h5netcdf==1.3.0
+h5py==3.10.0
+haversine==2.8.1
+hdfs==2.7.3
+hep-ml==0.7.2
+hijri-converter==2.3.1
+hmmlearn==0.3.2
+holidays==0.24
+holoviews==1.18.3
+hpsklearn==0.1.0
+html5lib==1.1
+htmlmin==0.1.12
+httpcore==1.0.5
+httplib2==0.21.0
+httptools==0.6.1
+httpx==0.27.0
+huggingface-hub==0.22.2
+hunspell==0.5.5
+hydra-slayer==0.5.0
+hyperopt==0.2.7
+hypertools==0.8.0
+idna==3.6
+igraph==0.11.4
+imagecodecs==2024.1.1
+imageio==2.33.1
+imbalanced-learn==0.12.2
+imgaug==0.4.0
+importlib-metadata==6.11.0
+importlib-metadata==7.0.1
+importlib-resources==6.1.1
+inequality==1.0.1
+iniconfig==2.0.0
+ipydatawidgets==4.3.5
+ipykernel==6.28.0
+ipyleaflet==0.18.2
+ipympl==0.7.0
+ipython-genutils==0.2.0
+ipython-genutils==0.2.0
+ipython-sql==0.5.0
+ipython==8.20.0
+ipyvolume==0.6.3
+ipyvue==1.10.2
+ipyvuetify==1.9.3
+ipywebrtc==0.6.0
+ipywidgets==7.7.1
+isoduration==20.11.0
+isort==5.13.2
+isoweek==1.3.3
+itsdangerous==2.1.2
+jaraco.classes==3.3.0
+jax-jumpy==1.0.0
+jax==0.4.23
+jaxlib==0.4.23.dev20240116
+jedi==0.19.1
+jeepney==0.8.0
+jieba==0.42.1
+jmespath==1.0.1
+joblib==1.3.2
+json5==0.9.14
+jsonpatch==1.33
+jsonpointer==2.4
+jsonschema-specifications==2023.12.1
+jsonschema==4.20.0
+jupyter-console==6.6.3
+jupyter-events==0.9.0
+jupyter-http-over-ws==0.0.8
+jupyter-lsp==1.5.1
+jupyter-server-mathjax==0.2.6
+jupyter-ydoc==0.2.5
+jupyter_client==7.4.9
+jupyter_client==8.6.0
+jupyter_core==5.7.1
+jupyter_server==2.13.0
+jupyter_server_fileid==0.9.1
+jupyter_server_proxy==4.1.0
+jupyter_server_terminals==0.5.1
+jupyter_server_ydoc==0.8.0
+jupyterlab-lsp==5.1.0
+jupyterlab-widgets==3.0.9
+jupyterlab==4.1.5
+jupyterlab_git==0.44.0
+jupyterlab_pygments==0.3.0
+jupyterlab_server==2.25.2
+jupytext==1.16.0
+kaggle-environments==1.14.3
+kaggle==1.6.8
+kagglehub==0.2.2
+keras-cv==0.8.2
+keras-nlp==0.8.2
+keras-tuner==1.4.6
+keras==3.1.1
+kernels-mixer==0.0.7
+keyring==24.3.0
+keyrings.google-artifactregistry-auth==1.1.2
+kfp-pipeline-spec==0.2.2
+kfp-server-api==2.0.5
+kfp==2.5.0
+kiwisolver==1.4.5
+kmapper==2.0.1
+kmodes==0.12.2
+korean-lunar-calendar==0.3.1
+kornia==0.7.2
+kornia_rs==0.1.3
+kt-legacy==1.0.5
+kubernetes==26.1.0
+langcodes==3.3.0
+langid==1.1.6
+lazy_loader==0.3
+learntools==0.3.4
+leven==1.0.4
+libclang==16.0.6
+libmambapy==1.5.0
+libpysal==4.9.2
+librosa==0.10.1
+lightgbm==4.2.0
+lightning-utilities==0.11.2
+lime==0.2.0.1
+line-profiler==4.1.2
+linkify-it-py==2.0.3
+llvmlite==0.41.1
+llvmlite==0.42.0
+lml==0.1.0
+locket==1.0.0
+loguru==0.7.2
+lxml==5.2.1
+lz4==4.3.3
+mamba==1.5.0
+mapclassify==2.6.1
+markdown-it-py==3.0.0
+marshmallow==3.21.1
+matplotlib-inline==0.1.6
+matplotlib-venn==0.11.10
+matplotlib==3.7.5
+matplotlib==3.8.3
+mccabe==0.7.0
+mdit-py-plugins==0.4.0
+mdurl==0.1.2
+memory-profiler==0.61.0
+menuinst==2.0.1
+mercantile==1.2.1
+mgwr==2.2.1
+missingno==0.5.2
+mistune==0.8.4
+mizani==0.11.1
+ml-dtypes==0.2.0
+mlcrate==0.2.0
+mlens==0.2.3
+mlxtend==0.23.1
+mne==1.6.1
+mnist==0.2.2
+momepy==0.7.0
+more-itertools==10.2.0
+mpld3==0.5.10
+mpmath==1.3.0
+msgpack==1.0.7
+multidict==6.0.4
+multimethod==1.10
+multipledispatch==1.0.0
+multiprocess==0.70.15
+munkres==1.1.4
+murmurhash==1.0.10
+mypy-extensions==1.0.0
+namex==0.0.7
+nb-conda-kernels==2.3.1
+nb_conda==2.2.1
+nbclassic==1.0.0
+nbclient==0.5.13
+nbconvert==6.4.5
+nbdime==3.2.0
+nbformat==5.9.2
+ndindex==1.8
+nest-asyncio==1.5.8
+networkx==3.2.1
+nibabel==5.2.1
+nilearn==0.10.3
+ninja==1.11.1.1
+nltk==3.2.4
+nose==1.3.7
+notebook==6.5.4
+notebook==6.5.6
+notebook_executor==0.2
+notebook_shim==0.2.3
+numba==0.58.1
+numba==0.59.1
+numexpr==2.10.0
+numpy==1.26.4
+nvidia-ml-py==11.495.46
+nvtx==0.2.10
+oauth2client==4.1.3
+oauthlib==3.2.2
+objsize==0.6.1
+odfpy==1.4.1
+olefile==0.47
+onnx==1.16.0
+opencensus-context==0.1.3
+opencensus==0.11.4
+opencv-contrib-python==4.9.0.80
+opencv-python-headless==4.9.0.80
+opencv-python==4.9.0.80
+openpyxl==3.1.2
+openslide-python==1.3.1
+opentelemetry-api==1.22.0
+opentelemetry-exporter-otlp-proto-common==1.22.0
+opentelemetry-exporter-otlp-proto-grpc==1.22.0
+opentelemetry-exporter-otlp-proto-http==1.22.0
+opentelemetry-exporter-otlp==1.22.0
+opentelemetry-proto==1.22.0
+opentelemetry-sdk==1.22.0
+opentelemetry-semantic-conventions==0.43b0
+opt-einsum==3.3.0
+optax==0.2.2
+optree==0.11.0
+optuna==3.6.1
+orbax-checkpoint==0.5.7
+ordered-set==4.1.0
+orjson==3.9.10
+ortools==9.4.1874
+osmnx==1.9.2
+overrides==7.4.0
+packaging==21.3
+pandas-datareader==0.10.0
+pandas-profiling==3.6.6
+pandas-summary==0.2.0
+pandas==2.1.4
+pandas==2.2.1
+pandasql==0.7.3
+pandocfilters==1.5.0
+panel==1.3.8
+papermill==2.5.0
+param==2.1.0
+parso==0.8.3
+partd==1.4.1
+path.py==12.5.0
+path==16.10.0
+pathos==0.3.2
+pathy==0.10.3
+patsy==0.5.6
+pdf2image==1.17.0
+peft==0.10.0
+pettingzoo==1.24.0
+pexpect==4.8.0
+pexpect==4.9.0
+phik==0.12.4
+pickleshare==0.7.5
+pillow==10.3.0
+pip==23.3.2
+pkgutil_resolve_name==1.3.10
+platformdirs==4.2.0
+plotly-express==0.4.1
+plotly==5.18.0
+plotnine==0.13.4
+pluggy==1.4.0
+pointpats==2.4.0
+polars==0.20.18
+polyglot==16.7.4
+pooch==1.8.1
+pox==0.3.4
+ppca==0.0.4
+ppft==1.7.6.8
+preprocessing==0.1.13
+preshed==3.0.9
+prettytable==3.9.0
+progressbar2==4.4.2
+prometheus-client==0.19.0
+promise==2.3
+prompt-toolkit==3.0.42
+prompt-toolkit==3.0.43
+prophet==1.1.1
+proto-plus==1.23.0
+protobuf==3.20.3
+protobuf==4.21.12
+psutil==5.9.3
+psutil==5.9.7
+ptyprocess==0.7.0
+pudb==2024.1
+pure-eval==0.2.2
+py-cpuinfo==9.0.0
+py-spy==0.3.14
+py4j==0.10.9.7
+pyLDAvis==3.4.1
+pyOpenSSL==23.3.0
+pyaml==23.12.0
+pyarrow-hotfix==0.6
+pyarrow==15.0.2
+pyasn1-modules==0.3.0
+pyasn1==0.5.1
+pybind11==2.12.0
+pyclipper==1.3.0.post5
+pycodestyle==2.11.1
+pycosat==0.6.6
+pycparser==2.21
+pycryptodome==3.20.0
+pyct==0.5.0
+pycuda==2024.1
+pydantic==2.5.3
+pydantic==2.6.4
+pydantic_core==2.14.6
+pydantic_core==2.16.3
+pydegensac==0.1.2
+pydicom==2.4.4
+pydocstyle==6.3.0
+pydot==1.4.2
+pydub==0.25.1
+pyemd==1.0.0
+pyerfa==2.0.1.1
+pyexcel-io==0.6.6
+pyexcel-ods==0.6.0
+pyflakes==3.2.0
+pygltflib==1.16.2
+pykalman==0.9.7
+pylibraft==23.8.0
+pylint==3.1.0
+pymc3==3.11.4
+pymongo==3.13.0
+pynndescent==0.5.12
+pynvml==11.4.1
+pynvrtc==9.2
+pyparsing==3.1.1
+pyparsing==3.1.2
+pypdf==4.1.0
+pyproj==3.6.1
+pysal==24.1
+pyshp==2.3.1
+pytesseract==0.3.10
+pytest==8.1.1
+python-bidi==0.4.2
+python-dateutil==2.9.0.post0
+python-dotenv==1.0.0
+python-json-logger==2.0.7
+python-louvain==0.16
+python-lsp-jsonrpc==1.1.2
+python-lsp-server==1.11.0
+python-slugify==8.0.4
+python-utils==3.8.2
+pythreejs==2.4.2
+pytoolconfig==1.3.1
+pytools==2024.1.1
+pytorch-ignite==0.5.0.post2
+pytorch-lightning==2.2.1
+pytz==2023.3.post1
+pytz==2024.1
+pyu2f==0.1.5
+pyviz_comms==3.0.2
+pyzmq==24.0.1
+pyzmq==25.1.2
+qgrid==1.3.1
+qtconsole==5.5.1
+quantecon==0.7.2
+qudida==0.0.4
+raft-dask==23.8.0
+rasterio==1.3.9
+rasterstats==0.19.0
+ray-cpp==2.9.0
+ray==2.9.0
+referencing==0.32.1
+regex==2023.12.25
+requests-oauthlib==1.3.1
+requests-toolbelt==0.10.1
+requests==2.31.0
+retrying==1.3.3
+retrying==1.3.4
+rfc3339-validator==0.1.4
+rfc3986-validator==0.1.1
+rgf-python==3.12.0
+rich-click==1.7.4
+rich==13.7.0
+rich==13.7.1
+rmm==23.8.0
+rope==1.13.0
+rpds-py==0.16.2
+rsa==4.9
+ruamel-yaml-conda==0.15.100
+ruamel.yaml.clib==0.2.7
+ruamel.yaml==0.17.40
+s2sphere==0.2.5
+s3fs==2024.2.0
+s3transfer==0.6.2
+safetensors==0.4.2
+scattertext==0.1.19
+scikit-image==0.22.0
+scikit-learn-intelex==2024.2.0
+scikit-learn==1.2.2
+scikit-multilearn==0.2.0
+scikit-optimize==0.10.1
+scikit-plot==0.3.7
+scikit-surprise==1.1.3
+scipy==1.11.4
+scipy==1.12.0
+seaborn==0.12.2
+segment_anything==1.0
+segregation==2.5
+semver==3.0.2
+sentencepiece==0.2.0
+sentry-sdk==1.44.1
+setproctitle==1.3.3
+setuptools-git==1.2
+setuptools-scm==8.0.4
+setuptools==69.0.3
+shap==0.44.1
+shapely==2.0.3
+shellingham==1.5.4
+shtab==1.7.1
+simpervisor==1.0.0
+simplejson==3.19.2
+six==1.16.0
+sklearn-pandas==2.2.0
+slicer==0.0.7
+smart-open==6.4.0
+smmap==5.0.1
+sniffio==1.3.0
+snowballstemmer==2.2.0
+snuggs==1.4.7
+sortedcontainers==2.4.0
+soundfile==0.12.1
+soupsieve==2.5
+soxr==0.3.7
+spacy-legacy==3.0.12
+spacy-loggers==1.0.5
+spacy==3.7.2
+spaghetti==1.7.5.post1
+spectral==0.23.1
+spglm==1.1.0
+sphinx-rtd-theme==0.2.4
+spint==1.0.7
+splot==1.1.5.post1
+spopt==0.6.0
+spreg==1.4.2
+spvcm==0.3.0
+sqlparse==0.4.4
+squarify==0.4.3
+srsly==2.4.8
+stable-baselines3==2.1.0
+stack-data==0.6.2
+stack-data==0.6.3
+stanio==0.5.0
+starlette==0.32.0.post1
+statsmodels==0.14.1
+stemming==1.0.1
+stop-words==2018.7.23
+stopit==1.1.2
+stumpy==1.12.0
+sympy==1.12
+tables==3.9.2
+tabulate==0.9.0
+tangled-up-in-unicode==0.2.0
+tbb==2021.12.0
+tblib==3.0.0
+tenacity==8.2.3
+tensorboard-data-server==0.7.2
+tensorboard-plugin-profile==2.15.0
+tensorboard==2.15.1
+tensorboardX==2.6.2.2
+tensorflow-cloud==0.1.16
+tensorflow-datasets==4.9.4
+tensorflow-decision-forests==1.8.1
+tensorflow-estimator==2.15.0
+tensorflow-hub==0.16.1
+tensorflow-io-gcs-filesystem==0.35.0
+tensorflow-io==0.35.0
+tensorflow-metadata==0.14.0
+tensorflow-probability==0.23.0
+tensorflow-serving-api==2.14.1
+tensorflow-text==2.15.0
+tensorflow-transform==0.14.0
+tensorflow==2.15.0
+tensorstore==0.1.56
+termcolor==2.4.0
+terminado==0.18.0
+testpath==0.6.0
+text-unidecode==1.3
+textblob==0.18.0.post0
+texttable==1.7.0
+tf_keras==2.15.1
+tfp-nightly==0.24.0.dev0
+thinc==8.2.2
+threadpoolctl==3.2.0
+tifffile==2023.12.9
+timm==0.9.16
+tinycss2==1.2.1
+tobler==0.11.2
+tokenizers==0.15.2
+toml==0.10.2
+tomli==2.0.1
+tomlkit==0.12.4
+toolz==0.12.1
+torch==2.1.2
+torchaudio==2.1.2
+torchdata==0.7.1
+torchinfo==1.8.0
+torchmetrics==1.3.2
+torchtext==0.16.2
+torchvision==0.16.2
+tornado==6.3.3
+tqdm==4.66.1
+traceml==1.0.8
+traitlets==5.9.0
+traittypes==0.2.1
+transformers==4.39.3
+treelite-runtime==3.2.0
+treelite==3.2.0
+trl==0.8.1
+truststore==0.8.0
+trx-python==0.2.9
+tsfresh==0.20.2
+typeguard==4.1.5
+typer==0.9.0
+typer==0.9.4
+types-python-dateutil==2.8.19.20240106
+typing-inspect==0.9.0
+typing-utils==0.1.0
+typing_extensions==4.9.0
+tyro==0.8.3
+tzdata==2023.4
+uc-micro-py==1.0.3
+ucx-py==0.33.0
+ujson==5.9.0
+umap-learn==0.5.5
+unicodedata2==15.1.0
+update-checker==0.18.0
+uri-template==1.3.0
+uritemplate==3.0.1
+urllib3==1.26.18
+urllib3==2.1.0
+urwid==2.6.10
+urwid_readline==0.14
+uvicorn==0.25.0
+uvloop==0.19.0
+vaex-astro==0.9.3
+vaex-core==4.17.1
+vaex-hdf5==0.14.1
+vaex-jupyter==0.8.2
+vaex-ml==0.18.3
+vaex-server==0.9.0
+vaex-viz==0.5.4
+vaex==4.17.0
+vec_noise==1.1.4
+vecstack==0.4.0
+virtualenv==20.21.0
+visions==0.7.5
+vowpalwabbit==9.9.0
+vtk==9.3.0
+wandb==0.16.5
+wasabi==1.1.2
+watchfiles==0.21.0
+wavio==0.0.8
+wcwidth==0.2.13
+weasel==0.3.4
+webcolors==1.13
+webencodings==0.5.1
+websocket-client==1.7.0
+websockets==12.0
+wfdb==4.1.2
+whatthepatch==1.0.5
+wheel==0.42.0
+widgetsnbextension==3.6.6
+witwidget==1.8.1
+woodwork==0.29.0
+wordcloud==1.9.3
+wordsegment==1.3.1
+wrapt==1.14.1
+xarray-einstats==0.7.0
+xarray==2024.3.0
+xgboost==2.0.3
+xvfbwrapper==0.2.9
+xxhash==3.4.1
+xyzservices==2023.10.1
+y-py==0.6.2
+yapf==0.40.2
+yarl==1.9.3
+yarl==1.9.4
+ydata-profiling==4.6.4
+yellowbrick==1.5
+ypy-websocket==0.8.4
+zict==3.0.0
+zipp==3.17.0
+zstandard==0.22.0

wandb/run-20240411_035909-21esl9hl/files/wandb-metadata.json ADDED Viewed

	@@ -0,0 +1,66 @@

+{
+    "os": "Linux-5.15.133+-x86_64-with-glibc2.31",
+    "python": "3.10.13",
+    "heartbeatAt": "2024-04-11T03:59:10.650560",
+    "startedAt": "2024-04-11T03:59:09.933024",
+    "docker": null,
+    "cuda": null,
+    "args": [],
+    "state": "running",
+    "program": "kaggle.ipynb",
+    "codePathLocal": null,
+    "root": "/kaggle/working",
+    "host": "321ddc84c049",
+    "username": "root",
+    "executable": "/opt/conda/bin/python3.10",
+    "cpu_count": 2,
+    "cpu_count_logical": 4,
+    "cpu_freq": {
+        "current": 2000.19,
+        "min": 0.0,
+        "max": 0.0
+    },
+    "cpu_freq_per_core": [
+        {
+            "current": 2000.19,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2000.19,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2000.19,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2000.19,
+            "min": 0.0,
+            "max": 0.0
+        }
+    ],
+    "disk": {
+        "/": {
+            "total": 8062.387607574463,
+            "used": 5566.961940765381
+        }
+    },
+    "gpu": "Tesla T4",
+    "gpu_count": 2,
+    "gpu_devices": [
+        {
+            "name": "Tesla T4",
+            "memory_total": 16106127360
+        },
+        {
+            "name": "Tesla T4",
+            "memory_total": 16106127360
+        }
+    ],
+    "memory": {
+        "total": 31.357559204101562
+    }
+}

wandb/run-20240411_035909-21esl9hl/files/wandb-summary.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"train_runtime": 14.0567, "train_samples_per_second": 2.846, "train_steps_per_second": 0.711, "total_flos": 28907911741440.0, "train_loss": 21.220675659179687, "train/epoch": 0.0, "train/global_step": 10, "_timestamp": 1712808008.9437401, "_runtime": 59.003005027770996, "_step": 0}

wandb/run-20240411_035909-21esl9hl/logs/debug-internal.log ADDED Viewed

	@@ -0,0 +1,118 @@

+2024-04-11 03:59:09,940 INFO    StreamThr :191 [internal.py:wandb_internal():86] W&B internal server running at pid: 191, started at: 2024-04-11 03:59:09.939664
+2024-04-11 03:59:09,941 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status
+2024-04-11 03:59:10,363 INFO    WriterThread:191 [datastore.py:open_for_write():87] open: /kaggle/working/wandb/run-20240411_035909-21esl9hl/run-21esl9hl.wandb
+2024-04-11 03:59:10,364 DEBUG   SenderThread:191 [sender.py:send():379] send: header
+2024-04-11 03:59:10,367 DEBUG   SenderThread:191 [sender.py:send():379] send: run
+2024-04-11 03:59:10,517 INFO    SenderThread:191 [dir_watcher.py:__init__():211] watching files in: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files
+2024-04-11 03:59:10,517 INFO    SenderThread:191 [sender.py:_start_run_threads():1124] run started: 21esl9hl with start time 1712807949.940735
+2024-04-11 03:59:10,526 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: check_version
+2024-04-11 03:59:10,526 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: check_version
+2024-04-11 03:59:10,621 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: run_start
+2024-04-11 03:59:10,635 DEBUG   HandlerThread:191 [system_info.py:__init__():26] System info init
+2024-04-11 03:59:10,635 DEBUG   HandlerThread:191 [system_info.py:__init__():41] System info init done
+2024-04-11 03:59:10,635 INFO    HandlerThread:191 [system_monitor.py:start():194] Starting system monitor
+2024-04-11 03:59:10,635 INFO    SystemMonitor:191 [system_monitor.py:_start():158] Starting system asset monitoring threads
+2024-04-11 03:59:10,635 INFO    HandlerThread:191 [system_monitor.py:probe():214] Collecting system info
+2024-04-11 03:59:10,639 INFO    SystemMonitor:191 [interfaces.py:start():190] Started cpu monitoring
+2024-04-11 03:59:10,640 INFO    SystemMonitor:191 [interfaces.py:start():190] Started disk monitoring
+2024-04-11 03:59:10,644 INFO    SystemMonitor:191 [interfaces.py:start():190] Started gpu monitoring
+2024-04-11 03:59:10,644 INFO    SystemMonitor:191 [interfaces.py:start():190] Started memory monitoring
+2024-04-11 03:59:10,645 INFO    SystemMonitor:191 [interfaces.py:start():190] Started network monitoring
+2024-04-11 03:59:10,650 DEBUG   HandlerThread:191 [system_info.py:probe():150] Probing system
+2024-04-11 03:59:10,652 DEBUG   HandlerThread:191 [gitlib.py:_init_repo():56] git repository is invalid
+2024-04-11 03:59:10,652 DEBUG   HandlerThread:191 [system_info.py:probe():198] Probing system done
+2024-04-11 03:59:10,652 DEBUG   HandlerThread:191 [system_monitor.py:probe():223] {'os': 'Linux-5.15.133+-x86_64-with-glibc2.31', 'python': '3.10.13', 'heartbeatAt': '2024-04-11T03:59:10.650560', 'startedAt': '2024-04-11T03:59:09.933024', 'docker': None, 'cuda': None, 'args': (), 'state': 'running', 'program': 'kaggle.ipynb', 'codePathLocal': None, 'root': '/kaggle/working', 'host': '321ddc84c049', 'username': 'root', 'executable': '/opt/conda/bin/python3.10', 'cpu_count': 2, 'cpu_count_logical': 4, 'cpu_freq': {'current': 2000.19, 'min': 0.0, 'max': 0.0}, 'cpu_freq_per_core': [{'current': 2000.19, 'min': 0.0, 'max': 0.0}, {'current': 2000.19, 'min': 0.0, 'max': 0.0}, {'current': 2000.19, 'min': 0.0, 'max': 0.0}, {'current': 2000.19, 'min': 0.0, 'max': 0.0}], 'disk': {'/': {'total': 8062.387607574463, 'used': 5566.961940765381}}, 'gpu': 'Tesla T4', 'gpu_count': 2, 'gpu_devices': [{'name': 'Tesla T4', 'memory_total': 16106127360}, {'name': 'Tesla T4', 'memory_total': 16106127360}], 'memory': {'total': 31.357559204101562}}
+2024-04-11 03:59:10,653 INFO    HandlerThread:191 [system_monitor.py:probe():224] Finished collecting system info
+2024-04-11 03:59:10,653 INFO    HandlerThread:191 [system_monitor.py:probe():227] Publishing system info
+2024-04-11 03:59:10,653 DEBUG   HandlerThread:191 [system_info.py:_save_conda():207] Saving list of conda packages installed into the current environment
+2024-04-11 03:59:11,520 INFO    Thread-12 :191 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/conda-environment.yaml
+2024-04-11 03:59:25,667 ERROR   HandlerThread:191 [system_info.py:_save_conda():221] Error saving conda packages: Command '['conda', 'env', 'export']' timed out after 15 seconds
+Traceback (most recent call last):
+  File "/opt/conda/lib/python3.10/site-packages/wandb/sdk/internal/system/system_info.py", line 214, in _save_conda
+    subprocess.call(
+  File "/opt/conda/lib/python3.10/subprocess.py", line 347, in call
+    return p.wait(timeout=timeout)
+  File "/opt/conda/lib/python3.10/subprocess.py", line 1209, in wait
+    return self._wait(timeout=timeout)
+  File "/opt/conda/lib/python3.10/subprocess.py", line 1951, in _wait
+    raise TimeoutExpired(self.args, timeout)
+subprocess.TimeoutExpired: Command '['conda', 'env', 'export']' timed out after 15 seconds
+2024-04-11 03:59:25,670 DEBUG   HandlerThread:191 [system_info.py:_save_conda():222] Saving conda packages done
+2024-04-11 03:59:25,671 INFO    HandlerThread:191 [system_monitor.py:probe():229] Finished publishing system info
+2024-04-11 03:59:25,678 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:25,678 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: keepalive
+2024-04-11 03:59:25,679 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:25,679 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: keepalive
+2024-04-11 03:59:25,679 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:25,679 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: keepalive
+2024-04-11 03:59:25,679 DEBUG   SenderThread:191 [sender.py:send():379] send: files
+2024-04-11 03:59:25,680 INFO    SenderThread:191 [sender.py:_save_file():1390] saving file wandb-metadata.json with policy now
+2024-04-11 03:59:25,883 INFO    wandb-upload_0:191 [upload_job.py:push():131] Uploaded file /tmp/tmpgmb8demxwandb/zh9coxtl-wandb-metadata.json
+2024-04-11 03:59:26,522 INFO    Thread-12 :191 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/wandb-metadata.json
+2024-04-11 03:59:26,714 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: python_packages
+2024-04-11 03:59:26,714 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: python_packages
+2024-04-11 03:59:26,717 DEBUG   SenderThread:191 [sender.py:send():379] send: telemetry
+2024-04-11 03:59:26,727 DEBUG   SenderThread:191 [sender.py:send():379] send: config
+2024-04-11 03:59:26,728 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: internal_messages
+2024-04-11 03:59:26,729 DEBUG   SenderThread:191 [sender.py:send():379] send: metric
+2024-04-11 03:59:26,729 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: stop_status
+2024-04-11 03:59:26,730 DEBUG   SenderThread:191 [sender.py:send():379] send: telemetry
+2024-04-11 03:59:26,731 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: stop_status
+2024-04-11 03:59:26,776 DEBUG   SenderThread:191 [sender.py:send():379] send: metric
+2024-04-11 03:59:26,776 WARNING SenderThread:191 [sender.py:send_metric():1341] Seen metric with glob (shouldn't happen)
+2024-04-11 03:59:26,776 DEBUG   SenderThread:191 [sender.py:send():379] send: telemetry
+2024-04-11 03:59:27,522 INFO    Thread-12 :191 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/requirements.txt
+2024-04-11 03:59:27,523 INFO    Thread-12 :191 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
+2024-04-11 03:59:29,523 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
+2024-04-11 03:59:30,951 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:31,524 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
+2024-04-11 03:59:33,525 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
+2024-04-11 03:59:35,952 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:40,958 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:41,528 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/config.yaml
+2024-04-11 03:59:41,717 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: internal_messages
+2024-04-11 03:59:41,717 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: stop_status
+2024-04-11 03:59:41,718 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: stop_status
+2024-04-11 03:59:45,530 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
+2024-04-11 03:59:46,261 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:51,262 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:56,417 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 03:59:56,717 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: stop_status
+2024-04-11 03:59:56,718 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: internal_messages
+2024-04-11 03:59:56,719 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: stop_status
+2024-04-11 03:59:57,534 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
+2024-04-11 04:00:01,827 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 04:00:06,828 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 04:00:08,943 DEBUG   SenderThread:191 [sender.py:send():379] send: telemetry
+2024-04-11 04:00:08,983 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: partial_history
+2024-04-11 04:00:08,985 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: summary_record
+2024-04-11 04:00:08,988 INFO    SenderThread:191 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
+2024-04-11 04:00:08,988 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: summary_record
+2024-04-11 04:00:08,989 INFO    SenderThread:191 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
+2024-04-11 04:00:08,989 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: summary_record
+2024-04-11 04:00:08,989 INFO    SenderThread:191 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
+2024-04-11 04:00:08,989 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: summary_record
+2024-04-11 04:00:08,990 INFO    SenderThread:191 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
+2024-04-11 04:00:08,990 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: summary_record
+2024-04-11 04:00:08,990 INFO    SenderThread:191 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
+2024-04-11 04:00:08,990 DEBUG   SenderThread:191 [sender.py:send():379] send: metric
+2024-04-11 04:00:08,991 DEBUG   SenderThread:191 [sender.py:send():379] send: history
+2024-04-11 04:00:08,991 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: summary_record
+2024-04-11 04:00:08,991 INFO    SenderThread:191 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
+2024-04-11 04:00:09,539 INFO    Thread-12 :191 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/wandb-summary.json
+2024-04-11 04:00:10,645 DEBUG   SystemMonitor:191 [system_monitor.py:_start():172] Starting system metrics aggregation loop
+2024-04-11 04:00:10,647 DEBUG   SenderThread:191 [sender.py:send():379] send: stats
+2024-04-11 04:00:11,539 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
+2024-04-11 04:00:11,715 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: stop_status
+2024-04-11 04:00:11,716 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: stop_status
+2024-04-11 04:00:11,719 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: internal_messages
+2024-04-11 04:00:11,833 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 04:00:12,540 INFO    Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/config.yaml
+2024-04-11 04:00:16,925 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 04:00:21,926 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 04:00:26,716 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: stop_status
+2024-04-11 04:00:26,716 DEBUG   SenderThread:191 [sender.py:send_request():406] send_request: stop_status
+2024-04-11 04:00:26,757 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: internal_messages
+2024-04-11 04:00:27,786 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 04:00:32,787 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
+2024-04-11 04:00:37,788 DEBUG   HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report

wandb/run-20240411_035909-21esl9hl/logs/debug.log ADDED Viewed

	@@ -0,0 +1,32 @@

+2024-04-11 03:59:09,934 INFO    MainThread:145 [wandb_setup.py:_flush():76] Current SDK version is 0.16.5
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Configure stats pid to 145
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Loading settings from /root/.config/wandb/settings
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Loading settings from /kaggle/working/wandb/settings
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Loading settings from environment variables: {}
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program': '<python with no main file>'}
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Applying login settings: {}
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_setup.py:_flush():76] Applying login settings: {'api_key': '***REDACTED***'}
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_init.py:_log_setup():527] Logging user logs to /kaggle/working/wandb/run-20240411_035909-21esl9hl/logs/debug.log
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_init.py:_log_setup():528] Logging internal logs to /kaggle/working/wandb/run-20240411_035909-21esl9hl/logs/debug-internal.log
+2024-04-11 03:59:09,935 INFO    MainThread:145 [wandb_init.py:_jupyter_setup():473] configuring jupyter hooks <wandb.sdk.wandb_init._WandbInit object at 0x7e1d3f588970>
+2024-04-11 03:59:09,936 INFO    MainThread:145 [wandb_init.py:init():567] calling init triggers
+2024-04-11 03:59:09,936 INFO    MainThread:145 [wandb_init.py:init():574] wandb.init called with sweep_config: {}
+config: {}
+2024-04-11 03:59:09,936 INFO    MainThread:145 [wandb_init.py:init():617] starting backend
+2024-04-11 03:59:09,936 INFO    MainThread:145 [wandb_init.py:init():621] setting up manager
+2024-04-11 03:59:09,938 INFO    MainThread:145 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
+2024-04-11 03:59:09,940 INFO    MainThread:145 [wandb_init.py:init():629] backend started and connected
+2024-04-11 03:59:09,953 INFO    MainThread:145 [wandb_run.py:_label_probe_notebook():1299] probe notebook
+2024-04-11 03:59:10,362 INFO    MainThread:145 [wandb_init.py:init():721] updated telemetry
+2024-04-11 03:59:10,366 INFO    MainThread:145 [wandb_init.py:init():754] communicating run to backend with 90.0 second timeout
+2024-04-11 03:59:10,526 INFO    MainThread:145 [wandb_run.py:_on_init():2344] communicating current version
+2024-04-11 03:59:10,613 INFO    MainThread:145 [wandb_run.py:_on_init():2353] got version response upgrade_message: "wandb version 0.16.6 is available!  To upgrade, please run:\n $ pip install wandb --upgrade"
+2024-04-11 03:59:10,614 INFO    MainThread:145 [wandb_init.py:init():805] starting run threads in backend
+2024-04-11 03:59:26,715 INFO    MainThread:145 [wandb_run.py:_console_start():2323] atexit reg
+2024-04-11 03:59:26,715 INFO    MainThread:145 [wandb_run.py:_redirect():2178] redirect: wrap_raw
+2024-04-11 03:59:26,716 INFO    MainThread:145 [wandb_run.py:_redirect():2243] Wrapping output streams.
+2024-04-11 03:59:26,716 INFO    MainThread:145 [wandb_run.py:_redirect():2268] Redirects installed.
+2024-04-11 03:59:26,717 INFO    MainThread:145 [wandb_init.py:init():848] run started, returning control to user process
+2024-04-11 03:59:26,723 INFO    MainThread:145 [wandb_run.py:_config_callback():1347] config_cb None None {'vocab_size': 250880, 'hidden_size': 1024, 'n_layer': 24, 'n_head': 16, 'layer_norm_epsilon': 1e-05, 'initializer_range': 0.02, 'use_cache': False, 'pretraining_tp': 1, 'apply_residual_connection_post_layernorm': False, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'bos_token_id': 1, 'eos_token_id': 2, 'slow_but_exact': False, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': None, 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['BloomForCausalLM'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'pad_token_id': 3, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'bigscience/bloomz-560m', 'transformers_version': '4.39.3', 'attention_softmax_in_fp32': True, 'bias_dropout_fusion': True, 'unk_token_id': 0, 'masked_softmax_fusion': True, 'model_type': 'bloom', 'n_inner': None, 
'offset_alibi': 100, 'seq_length': 2048, 'skip_bias_add': True, 'skip_bias_add_qkv': False, 'quantization_config': {'quant_method': 'QuantizationMethod.BITS_AND_BYTES', '_load_in_8bit': False, '_load_in_4bit': True, 'llm_int8_threshold': 6.0, 'llm_int8_skip_modules': None, 'llm_int8_enable_fp32_cpu_offload': False, 'llm_int8_has_fp16_weight': False, 'bnb_4bit_quant_type': 'nf4', 'bnb_4bit_use_double_quant': False, 'bnb_4bit_compute_dtype': 'float16', 'bnb_4bit_quant_storage': 'uint8', 'load_in_4bit': True, 'load_in_8bit': False}, 'output_dir': '/kaggle/working/', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': False, 'do_predict': False, 'evaluation_strategy': 'no', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'learning_rate': 3e-05, 'weight_decay': 0.0001, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 0.3, 'num_train_epochs': 5, 'max_steps': 10, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/kaggle/working/runs/Apr11_03-48-59_321ddc84c049', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 20, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 1, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 
'debug': [], 'dataloader_drop_last': False, 'eval_steps': None, 'dataloader_num_workers': 8, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': '/kaggle/working/', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'paged_adamw_32bit', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['tensorboard', 'wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': True, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': True, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None}

wandb/run-20240411_035909-21esl9hl/run-21esl9hl.wandb ADDED Viewed

Binary file (18.5 kB). View file