Femboyuwu2000 committed on
Commit
5415c3f
1 Parent(s): f4089ce

bloomz_bl_story

This view is limited to 50 files because it contains too many changes. See raw diff.
Files changed (50)
  1. .gitattributes +1 -0
  2. README.md +1 -1
  3. adapter_config.json +1 -1
  4. adapter_model.safetensors +1 -1
  5. bloomz_dam_my/README.md +202 -0
  6. bloomz_dam_my/adapter_config.json +30 -0
  7. bloomz_dam_my/adapter_model.safetensors +3 -0
  8. bloomz_dam_my/special_tokens_map.json +17 -0
  9. bloomz_dam_my/spiece.model +3 -0
  10. bloomz_dam_my/tokenizer.json +3 -0
  11. bloomz_dam_my/tokenizer_config.json +39 -0
  12. bloomz_dam_my/training_args.bin +3 -0
  13. runs/Apr11_04-02-02_321ddc84c049/events.out.tfevents.1712808126.321ddc84c049.414.0 +3 -0
  14. runs/Apr11_04-04-49_321ddc84c049/events.out.tfevents.1712808294.321ddc84c049.740.0 +3 -0
  15. runs/Apr11_04-07-17_321ddc84c049/events.out.tfevents.1712808441.321ddc84c049.1050.0 +3 -0
  16. tokenizer.json +2 -2
  17. training_args.bin +1 -1
  18. wandb/debug-internal.log +0 -0
  19. wandb/debug.log +29 -30
  20. wandb/run-20240411_035909-21esl9hl/files/output.log +1 -0
  21. wandb/run-20240411_035909-21esl9hl/files/wandb-summary.json +1 -1
  22. wandb/run-20240411_035909-21esl9hl/logs/debug-internal.log +158 -0
  23. wandb/run-20240411_035909-21esl9hl/logs/debug.log +2 -0
  24. wandb/run-20240411_035909-21esl9hl/run-21esl9hl.wandb +0 -0
  25. wandb/run-20240411_040208-txpa3x4k/files/conda-environment.yaml +0 -0
  26. wandb/run-20240411_040208-txpa3x4k/files/config.yaml +701 -0
  27. wandb/run-20240411_040208-txpa3x4k/files/output.log +18 -0
  28. wandb/run-20240411_040208-txpa3x4k/files/requirements.txt +864 -0
  29. wandb/run-20240411_040208-txpa3x4k/files/wandb-metadata.json +66 -0
  30. wandb/run-20240411_040208-txpa3x4k/files/wandb-summary.json +1 -0
  31. wandb/run-20240411_040208-txpa3x4k/logs/debug-internal.log +273 -0
  32. wandb/run-20240411_040208-txpa3x4k/logs/debug.log +33 -0
  33. wandb/run-20240411_040208-txpa3x4k/run-txpa3x4k.wandb +0 -0
  34. wandb/run-20240411_040455-4dprer7c/files/conda-environment.yaml +0 -0
  35. wandb/run-20240411_040455-4dprer7c/files/config.yaml +701 -0
  36. wandb/run-20240411_040455-4dprer7c/files/output.log +12 -0
  37. wandb/run-20240411_040455-4dprer7c/files/requirements.txt +864 -0
  38. wandb/run-20240411_040455-4dprer7c/files/wandb-metadata.json +66 -0
  39. wandb/run-20240411_040455-4dprer7c/files/wandb-summary.json +1 -0
  40. wandb/run-20240411_040455-4dprer7c/logs/debug-internal.log +254 -0
  41. wandb/run-20240411_040455-4dprer7c/logs/debug.log +33 -0
  42. wandb/run-20240411_040455-4dprer7c/run-4dprer7c.wandb +0 -0
  43. wandb/run-20240411_040722-rimyh9a1/files/conda-environment.yaml +0 -0
  44. wandb/run-20240411_040722-rimyh9a1/files/config.yaml +702 -0
  45. wandb/run-20240411_040722-rimyh9a1/files/output.log +0 -0
  46. wandb/run-20240411_040722-rimyh9a1/files/requirements.txt +864 -0
  47. wandb/run-20240411_040722-rimyh9a1/files/wandb-metadata.json +66 -0
  48. wandb/run-20240411_040722-rimyh9a1/files/wandb-summary.json +1 -0
  49. wandb/run-20240411_040722-rimyh9a1/logs/debug-internal.log +0 -0
  50. wandb/run-20240411_040722-rimyh9a1/logs/debug.log +31 -0
.gitattributes CHANGED
@@ -37,3 +37,4 @@ wandb/run-20240408_203054-ldiuneeg/run-ldiuneeg.wandb filter=lfs diff=lfs merge=
  wandb/run-20240410_010250-ft4a6i5j/run-ft4a6i5j.wandb filter=lfs diff=lfs merge=lfs -text
  wandb/run-20240410_115017-r9p6sok2/run-r9p6sok2.wandb filter=lfs diff=lfs merge=lfs -text
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
+ wandb/run-20240411_040722-rimyh9a1/run-rimyh9a1.wandb filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -42,7 +42,7 @@ The following hyperparameters were used during training:
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
  - lr_scheduler_type: cosine
  - lr_scheduler_warmup_ratio: 0.03
- - training_steps: 10
+ - training_steps: 20000

  ### Training results

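For context, here is a minimal sketch (not the training script from this commit) of how the hyperparameters above map onto transformers' `TrainingArguments`; the values are taken from this README hunk and the wandb config dump further down, everything else is assumed:

```python
# Hypothetical reconstruction, not the repo's actual script: TrainingArguments matching
# the hyperparameters listed in the README and the logged run config (max_steps now 20000).
from transformers import TrainingArguments

training_args = TrainingArguments(
    output_dir="/kaggle/working/",        # output_dir recorded in the wandb config
    per_device_train_batch_size=8,
    learning_rate=3e-5,
    weight_decay=0.001,
    max_grad_norm=0.3,
    lr_scheduler_type="cosine",
    warmup_ratio=0.03,
    max_steps=20_000,                     # changed from 10 to 20000 in this commit
    optim="paged_adamw_32bit",            # Adam with betas=(0.9, 0.999) and epsilon=1e-08
    logging_steps=20,
    save_steps=20,
    save_total_limit=1,
    gradient_checkpointing=True,
    report_to=["tensorboard", "wandb"],
)
```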
adapter_config.json CHANGED
@@ -20,8 +20,8 @@
  "rank_pattern": {},
  "revision": null,
  "target_modules": [
- "lm_head",
  "query_key_value",
+ "lm_head",
  "dense_h_to_4h"
  ],
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:9baf0d7e0bee813113ef40ed93ff8433a426745af90937aabc260a737c8f5277
+ oid sha256:7ac730ac4465d0ec9fbe49ed9c5ad2a69ec11ddf9dc1d9cb0f5595f60817af39
  size 1042757704
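The safetensors, spiece.model, tokenizer.json, training_args.bin and tfevents entries in this commit are Git LFS pointer files (an oid and a size), not the binaries themselves. A minimal sketch, assuming the real file has been fetched with `git lfs pull`, of checking a local copy against the pointer:

```python
# Sketch only: verify a locally fetched file against the sha256/size in its LFS pointer.
import hashlib
from pathlib import Path

def matches_lfs_pointer(path: str, expected_oid: str, expected_size: int) -> bool:
    data = Path(path).read_bytes()
    return len(data) == expected_size and hashlib.sha256(data).hexdigest() == expected_oid

# oid/size taken from the new adapter_model.safetensors pointer above
print(matches_lfs_pointer(
    "adapter_model.safetensors",
    "7ac730ac4465d0ec9fbe49ed9c5ad2a69ec11ddf9dc1d9cb0f5595f60817af39",
    1042757704,
))
```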
bloomz_dam_my/README.md ADDED
@@ -0,0 +1,202 @@
+ ---
+ library_name: peft
+ base_model: bigscience/bloomz-560m
+ ---
+
+ # Model Card for Model ID
+
+ <!-- Provide a quick summary of what the model is/does. -->
+
+
+
+ ## Model Details
+
+ ### Model Description
+
+ <!-- Provide a longer summary of what this model is. -->
+
+
+
+ - **Developed by:** [More Information Needed]
+ - **Funded by [optional]:** [More Information Needed]
+ - **Shared by [optional]:** [More Information Needed]
+ - **Model type:** [More Information Needed]
+ - **Language(s) (NLP):** [More Information Needed]
+ - **License:** [More Information Needed]
+ - **Finetuned from model [optional]:** [More Information Needed]
+
+ ### Model Sources [optional]
+
+ <!-- Provide the basic links for the model. -->
+
+ - **Repository:** [More Information Needed]
+ - **Paper [optional]:** [More Information Needed]
+ - **Demo [optional]:** [More Information Needed]
+
+ ## Uses
+
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
+
+ ### Direct Use
+
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
+
+ [More Information Needed]
+
+ ### Downstream Use [optional]
+
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
+
+ [More Information Needed]
+
+ ### Out-of-Scope Use
+
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
+
+ [More Information Needed]
+
+ ## Bias, Risks, and Limitations
+
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
+
+ [More Information Needed]
+
+ ### Recommendations
+
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
+
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
+
+ ## How to Get Started with the Model
+
+ Use the code below to get started with the model.
+
+ [More Information Needed]
+
+ ## Training Details
+
+ ### Training Data
+
+ <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
+
+ [More Information Needed]
+
+ ### Training Procedure
+
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
+
+ #### Preprocessing [optional]
+
+ [More Information Needed]
+
+
+ #### Training Hyperparameters
+
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
+
+ #### Speeds, Sizes, Times [optional]
+
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
+
+ [More Information Needed]
+
+ ## Evaluation
+
+ <!-- This section describes the evaluation protocols and provides the results. -->
+
+ ### Testing Data, Factors & Metrics
+
+ #### Testing Data
+
+ <!-- This should link to a Dataset Card if possible. -->
+
+ [More Information Needed]
+
+ #### Factors
+
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
+
+ [More Information Needed]
+
+ #### Metrics
+
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
+
+ [More Information Needed]
+
+ ### Results
+
+ [More Information Needed]
+
+ #### Summary
+
+
+
+ ## Model Examination [optional]
+
+ <!-- Relevant interpretability work for the model goes here -->
+
+ [More Information Needed]
+
+ ## Environmental Impact
+
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
+
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
+
+ - **Hardware Type:** [More Information Needed]
+ - **Hours used:** [More Information Needed]
+ - **Cloud Provider:** [More Information Needed]
+ - **Compute Region:** [More Information Needed]
+ - **Carbon Emitted:** [More Information Needed]
+
+ ## Technical Specifications [optional]
+
+ ### Model Architecture and Objective
+
+ [More Information Needed]
+
+ ### Compute Infrastructure
+
+ [More Information Needed]
+
+ #### Hardware
+
+ [More Information Needed]
+
+ #### Software
+
+ [More Information Needed]
+
+ ## Citation [optional]
+
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
+
+ **BibTeX:**
+
+ [More Information Needed]
+
+ **APA:**
+
+ [More Information Needed]
+
+ ## Glossary [optional]
+
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
+
+ [More Information Needed]
+
+ ## More Information [optional]
+
+ [More Information Needed]
+
+ ## Model Card Authors [optional]
+
+ [More Information Needed]
+
+ ## Model Card Contact
+
+ [More Information Needed]
+ ### Framework versions
+
+ - PEFT 0.10.0
bloomz_dam_my/adapter_config.json ADDED
@@ -0,0 +1,30 @@
+ {
+ "alpha_pattern": {},
+ "auto_mapping": null,
+ "base_model_name_or_path": "bigscience/bloomz-560m",
+ "bias": "none",
+ "fan_in_fan_out": false,
+ "inference_mode": true,
+ "init_lora_weights": true,
+ "layer_replication": null,
+ "layers_pattern": null,
+ "layers_to_transform": null,
+ "loftq_config": {},
+ "lora_alpha": 16,
+ "lora_dropout": 0.01,
+ "megatron_config": null,
+ "megatron_core": "megatron.core",
+ "modules_to_save": null,
+ "peft_type": "LORA",
+ "r": 8,
+ "rank_pattern": {},
+ "revision": null,
+ "target_modules": [
+ "lm_head",
+ "query_key_value",
+ "dense_h_to_4h"
+ ],
+ "task_type": "CAUSAL_LM",
+ "use_dora": false,
+ "use_rslora": true
+ }
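A minimal usage sketch (assumed, not part of the commit): the adapter_config.json above is what peft writes for a LoraConfig with r=8, lora_alpha=16, rsLoRA enabled and lm_head/query_key_value/dense_h_to_4h as target modules, and the saved adapter under bloomz_dam_my/ can be re-attached to the base model:

```python
# Sketch under assumptions (paths and device handling simplified): rebuild the LoRA setup
# described by adapter_config.json and load the saved adapter onto bigscience/bloomz-560m.
from transformers import AutoModelForCausalLM
from peft import LoraConfig, PeftModel

# LoraConfig equivalent to the JSON above (remaining fields are peft 0.10.0 defaults).
lora_config = LoraConfig(
    r=8,
    lora_alpha=16,
    lora_dropout=0.01,
    use_rslora=True,
    target_modules=["lm_head", "query_key_value", "dense_h_to_4h"],
    task_type="CAUSAL_LM",
)

base = AutoModelForCausalLM.from_pretrained("bigscience/bloomz-560m")
model = PeftModel.from_pretrained(base, "bloomz_dam_my")  # directory with adapter_config.json + adapter_model.safetensors
model.eval()
```

Because lm_head sits in target_modules, peft also saves the embedding layers, which is what the `save_embedding_layers` warning in the output.log diff below refers to.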
bloomz_dam_my/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:9baf0d7e0bee813113ef40ed93ff8433a426745af90937aabc260a737c8f5277
+ size 1042757704
bloomz_dam_my/special_tokens_map.json ADDED
@@ -0,0 +1,17 @@
+ {
+ "eos_token": {
+ "content": "</s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "</s>",
+ "unk_token": {
+ "content": "<unk>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ }
+ }
bloomz_dam_my/spiece.model ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:ef78f86560d809067d12bac6c09f19a462cb3af3f54d2b8acbba26e1433125d6
+ size 4309802
bloomz_dam_my/tokenizer.json ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:8af11292e1e8b6e7fc393100a39b873778106b40afa8ef4e7c198f0bb5c03f82
+ size 16315312
bloomz_dam_my/tokenizer_config.json ADDED
@@ -0,0 +1,39 @@
+ {
+ "added_tokens_decoder": {
+ "0": {
+ "content": "<pad>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "1": {
+ "content": "</s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "2": {
+ "content": "<unk>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ }
+ },
+ "additional_special_tokens": [],
+ "clean_up_tokenization_spaces": true,
+ "eos_token": "</s>",
+ "extra_ids": 0,
+ "max_length": 1024,
+ "model_max_length": 1000000000000000019884624838656,
+ "pad_token": "</s>",
+ "sp_model_kwargs": {},
+ "tokenizer_class": "T5Tokenizer",
+ "truncation": true,
+ "unk_token": "<unk>"
+ }
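A small sketch (assumed usage, not in the commit) of loading this tokenizer folder; note the config declares a T5Tokenizer backed by spiece.model, with `</s>` reused as the padding token, rather than the Bloom tokenizer of the base model:

```python
# Sketch only: inspect the tokenizer saved under bloomz_dam_my/.
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("bloomz_dam_my")
print(type(tok).__name__)                            # a T5 tokenizer class, per tokenizer_config.json
print(tok.eos_token, tok.pad_token, tok.unk_token)   # </s> </s> <unk>
```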
bloomz_dam_my/training_args.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:9fcb5d40d27446b473f3cf6a16217747341cc71590de85e4a2a9001a3be0bfca
+ size 4920
runs/Apr11_04-02-02_321ddc84c049/events.out.tfevents.1712808126.321ddc84c049.414.0 ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:7dc0de91e150ffa3ae50d49ef29cc00f0d6cd90e2dfce554c500adb81011433e
+ size 15910
runs/Apr11_04-04-49_321ddc84c049/events.out.tfevents.1712808294.321ddc84c049.740.0 ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:77ccd6bb0384d7f0b531b4689a6d5091c5cf8ef5fe830dd33a06449fc0a4e6c6
+ size 15706
runs/Apr11_04-07-17_321ddc84c049/events.out.tfevents.1712808441.321ddc84c049.1050.0 ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:39731fc62d56057a7ac2a4a59ab5f57cc8eafb01f7eadaa3b6146959084621fe
+ size 233938
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:8af11292e1e8b6e7fc393100a39b873778106b40afa8ef4e7c198f0bb5c03f82
- size 16315312
+ oid sha256:54e5c72a5ea09da48b2f316760b8bc5a445683ab9a5bc6b68db5d8db624ecceb
+ size 16315213
training_args.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:9fcb5d40d27446b473f3cf6a16217747341cc71590de85e4a2a9001a3be0bfca
+ oid sha256:7ba44607bb84c5fd76d74e8d257eb1a18a8dceedf164c95e0e7b4eb4771e56e1
  size 4920
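training_args.bin is the TrainingArguments object that transformers' Trainer serializes with torch.save, so the new max_steps value can be confirmed directly; a minimal sketch, assuming a compatible transformers version is installed:

```python
# Sketch only: unpickle training_args.bin and check the settings recorded in this commit.
import torch

args = torch.load("training_args.bin")
print(args.max_steps, args.lr_scheduler_type, args.warmup_ratio)
```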
wandb/debug-internal.log CHANGED
The diff for this file is too large to render. See raw diff
 
wandb/debug.log CHANGED
@@ -1,32 +1,31 @@
1
- 2024-04-11 03:59:09,934 INFO MainThread:145 [wandb_setup.py:_flush():76] Current SDK version is 0.16.5
2
- 2024-04-11 03:59:09,935 INFO MainThread:145 [wandb_setup.py:_flush():76] Configure stats pid to 145
3
- 2024-04-11 03:59:09,935 INFO MainThread:145 [wandb_setup.py:_flush():76] Loading settings from /root/.config/wandb/settings
4
- 2024-04-11 03:59:09,935 INFO MainThread:145 [wandb_setup.py:_flush():76] Loading settings from /kaggle/working/wandb/settings
5
- 2024-04-11 03:59:09,935 INFO MainThread:145 [wandb_setup.py:_flush():76] Loading settings from environment variables: {}
6
- 2024-04-11 03:59:09,935 INFO MainThread:145 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
7
- 2024-04-11 03:59:09,935 INFO MainThread:145 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program': '<python with no main file>'}
8
- 2024-04-11 03:59:09,935 INFO MainThread:145 [wandb_setup.py:_flush():76] Applying login settings: {}
9
- 2024-04-11 03:59:09,935 INFO MainThread:145 [wandb_setup.py:_flush():76] Applying login settings: {'api_key': '***REDACTED***'}
10
- 2024-04-11 03:59:09,935 INFO MainThread:145 [wandb_init.py:_log_setup():527] Logging user logs to /kaggle/working/wandb/run-20240411_035909-21esl9hl/logs/debug.log
11
- 2024-04-11 03:59:09,935 INFO MainThread:145 [wandb_init.py:_log_setup():528] Logging internal logs to /kaggle/working/wandb/run-20240411_035909-21esl9hl/logs/debug-internal.log
12
- 2024-04-11 03:59:09,935 INFO MainThread:145 [wandb_init.py:_jupyter_setup():473] configuring jupyter hooks <wandb.sdk.wandb_init._WandbInit object at 0x7e1d3f588970>
13
- 2024-04-11 03:59:09,936 INFO MainThread:145 [wandb_init.py:init():567] calling init triggers
14
- 2024-04-11 03:59:09,936 INFO MainThread:145 [wandb_init.py:init():574] wandb.init called with sweep_config: {}
15
  config: {}
16
- 2024-04-11 03:59:09,936 INFO MainThread:145 [wandb_init.py:init():617] starting backend
17
- 2024-04-11 03:59:09,936 INFO MainThread:145 [wandb_init.py:init():621] setting up manager
18
- 2024-04-11 03:59:09,938 INFO MainThread:145 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
19
- 2024-04-11 03:59:09,940 INFO MainThread:145 [wandb_init.py:init():629] backend started and connected
20
- 2024-04-11 03:59:09,953 INFO MainThread:145 [wandb_run.py:_label_probe_notebook():1299] probe notebook
21
- 2024-04-11 03:59:10,362 INFO MainThread:145 [wandb_init.py:init():721] updated telemetry
22
- 2024-04-11 03:59:10,366 INFO MainThread:145 [wandb_init.py:init():754] communicating run to backend with 90.0 second timeout
23
- 2024-04-11 03:59:10,526 INFO MainThread:145 [wandb_run.py:_on_init():2344] communicating current version
24
- 2024-04-11 03:59:10,613 INFO MainThread:145 [wandb_run.py:_on_init():2353] got version response upgrade_message: "wandb version 0.16.6 is available! To upgrade, please run:\n $ pip install wandb --upgrade"
25
 
26
- 2024-04-11 03:59:10,614 INFO MainThread:145 [wandb_init.py:init():805] starting run threads in backend
27
- 2024-04-11 03:59:26,715 INFO MainThread:145 [wandb_run.py:_console_start():2323] atexit reg
28
- 2024-04-11 03:59:26,715 INFO MainThread:145 [wandb_run.py:_redirect():2178] redirect: wrap_raw
29
- 2024-04-11 03:59:26,716 INFO MainThread:145 [wandb_run.py:_redirect():2243] Wrapping output streams.
30
- 2024-04-11 03:59:26,716 INFO MainThread:145 [wandb_run.py:_redirect():2268] Redirects installed.
31
- 2024-04-11 03:59:26,717 INFO MainThread:145 [wandb_init.py:init():848] run started, returning control to user process
32
- 2024-04-11 03:59:26,723 INFO MainThread:145 [wandb_run.py:_config_callback():1347] config_cb None None {'vocab_size': 250880, 'hidden_size': 1024, 'n_layer': 24, 'n_head': 16, 'layer_norm_epsilon': 1e-05, 'initializer_range': 0.02, 'use_cache': False, 'pretraining_tp': 1, 'apply_residual_connection_post_layernorm': False, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'bos_token_id': 1, 'eos_token_id': 2, 'slow_but_exact': False, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': None, 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['BloomForCausalLM'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'pad_token_id': 3, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'bigscience/bloomz-560m', 'transformers_version': '4.39.3', 'attention_softmax_in_fp32': True, 'bias_dropout_fusion': True, 'unk_token_id': 0, 'masked_softmax_fusion': True, 'model_type': 'bloom', 'n_inner': None, 'offset_alibi': 100, 'seq_length': 2048, 'skip_bias_add': True, 'skip_bias_add_qkv': False, 'quantization_config': {'quant_method': 'QuantizationMethod.BITS_AND_BYTES', '_load_in_8bit': False, '_load_in_4bit': True, 'llm_int8_threshold': 6.0, 'llm_int8_skip_modules': None, 'llm_int8_enable_fp32_cpu_offload': False, 'llm_int8_has_fp16_weight': False, 'bnb_4bit_quant_type': 'nf4', 'bnb_4bit_use_double_quant': False, 'bnb_4bit_compute_dtype': 'float16', 'bnb_4bit_quant_storage': 'uint8', 'load_in_4bit': True, 'load_in_8bit': False}, 'output_dir': '/kaggle/working/', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': False, 'do_predict': False, 'evaluation_strategy': 'no', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'learning_rate': 3e-05, 'weight_decay': 0.0001, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 0.3, 'num_train_epochs': 5, 'max_steps': 10, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/kaggle/working/runs/Apr11_03-48-59_321ddc84c049', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 20, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 1, 'save_safetensors': 
True, 'save_on_each_node': False, 'save_only_model': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': None, 'dataloader_num_workers': 8, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': '/kaggle/working/', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'paged_adamw_32bit', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['tensorboard', 'wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': True, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': True, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None}
 
1
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Current SDK version is 0.16.5
2
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Configure stats pid to 1050
3
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Loading settings from /root/.config/wandb/settings
4
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Loading settings from /kaggle/working/wandb/settings
5
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Loading settings from environment variables: {}
6
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
7
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program': '<python with no main file>'}
8
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Applying login settings: {}
9
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_init.py:_log_setup():527] Logging user logs to /kaggle/working/wandb/run-20240411_040722-rimyh9a1/logs/debug.log
10
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_init.py:_log_setup():528] Logging internal logs to /kaggle/working/wandb/run-20240411_040722-rimyh9a1/logs/debug-internal.log
11
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_init.py:_jupyter_setup():473] configuring jupyter hooks <wandb.sdk.wandb_init._WandbInit object at 0x7d563f5f5120>
12
+ 2024-04-11 04:07:22,844 INFO MainThread:1050 [wandb_init.py:init():567] calling init triggers
13
+ 2024-04-11 04:07:22,844 INFO MainThread:1050 [wandb_init.py:init():574] wandb.init called with sweep_config: {}
 
14
  config: {}
15
+ 2024-04-11 04:07:22,844 INFO MainThread:1050 [wandb_init.py:init():617] starting backend
16
+ 2024-04-11 04:07:22,844 INFO MainThread:1050 [wandb_init.py:init():621] setting up manager
17
+ 2024-04-11 04:07:22,847 INFO MainThread:1050 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
18
+ 2024-04-11 04:07:22,848 INFO MainThread:1050 [wandb_init.py:init():629] backend started and connected
19
+ 2024-04-11 04:07:22,865 INFO MainThread:1050 [wandb_run.py:_label_probe_notebook():1299] probe notebook
20
+ 2024-04-11 04:07:23,106 INFO MainThread:1050 [wandb_init.py:init():721] updated telemetry
21
+ 2024-04-11 04:07:23,108 INFO MainThread:1050 [wandb_init.py:init():754] communicating run to backend with 90.0 second timeout
22
+ 2024-04-11 04:07:23,235 INFO MainThread:1050 [wandb_run.py:_on_init():2344] communicating current version
23
+ 2024-04-11 04:07:23,323 INFO MainThread:1050 [wandb_run.py:_on_init():2353] got version response upgrade_message: "wandb version 0.16.6 is available! To upgrade, please run:\n $ pip install wandb --upgrade"
24
 
25
+ 2024-04-11 04:07:23,324 INFO MainThread:1050 [wandb_init.py:init():805] starting run threads in backend
26
+ 2024-04-11 04:07:39,317 INFO MainThread:1050 [wandb_run.py:_console_start():2323] atexit reg
27
+ 2024-04-11 04:07:39,317 INFO MainThread:1050 [wandb_run.py:_redirect():2178] redirect: wrap_raw
28
+ 2024-04-11 04:07:39,318 INFO MainThread:1050 [wandb_run.py:_redirect():2243] Wrapping output streams.
29
+ 2024-04-11 04:07:39,318 INFO MainThread:1050 [wandb_run.py:_redirect():2268] Redirects installed.
30
+ 2024-04-11 04:07:39,319 INFO MainThread:1050 [wandb_init.py:init():848] run started, returning control to user process
31
+ 2024-04-11 04:07:39,324 INFO MainThread:1050 [wandb_run.py:_config_callback():1347] config_cb None None {'vocab_size': 250880, 'hidden_size': 1024, 'n_layer': 24, 'n_head': 16, 'layer_norm_epsilon': 1e-05, 'initializer_range': 0.02, 'use_cache': False, 'pretraining_tp': 1, 'apply_residual_connection_post_layernorm': False, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'bos_token_id': 1, 'eos_token_id': 2, 'slow_but_exact': False, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': None, 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['BloomForCausalLM'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'pad_token_id': 3, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'bigscience/bloomz-560m', 'transformers_version': '4.39.3', 'attention_softmax_in_fp32': True, 'bias_dropout_fusion': True, 'unk_token_id': 0, 'masked_softmax_fusion': True, 'model_type': 'bloom', 'n_inner': None, 'offset_alibi': 100, 'seq_length': 2048, 'skip_bias_add': True, 'skip_bias_add_qkv': False, 'quantization_config': {'quant_method': 'QuantizationMethod.BITS_AND_BYTES', '_load_in_8bit': False, '_load_in_4bit': True, 'llm_int8_threshold': 6.0, 'llm_int8_skip_modules': None, 'llm_int8_enable_fp32_cpu_offload': False, 'llm_int8_has_fp16_weight': False, 'bnb_4bit_quant_type': 'nf4', 'bnb_4bit_use_double_quant': False, 'bnb_4bit_compute_dtype': 'float16', 'bnb_4bit_quant_storage': 'uint8', 'load_in_4bit': True, 'load_in_8bit': False}, 'output_dir': '/kaggle/working/', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': False, 'do_predict': False, 'evaluation_strategy': 'no', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'learning_rate': 3e-05, 'weight_decay': 0.001, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 0.3, 'num_train_epochs': 5, 'max_steps': 20000, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/kaggle/working/runs/Apr11_04-07-17_321ddc84c049', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 20, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 1, 
'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': None, 'dataloader_num_workers': 8, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': '/kaggle/working/', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'paged_adamw_32bit', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['tensorboard', 'wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': True, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': True, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None}
wandb/run-20240411_035909-21esl9hl/files/output.log CHANGED
@@ -101,3 +101,4 @@ To disable this warning, you can either:
  - Avoid using `tokenizers` before the fork if possible
  - Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
  /opt/conda/lib/python3.10/site-packages/peft/utils/save_and_load.py:139: UserWarning: Setting `save_embedding_layers` to `True` as embedding layers found in `target_modules`.
+ warnings.warn("Setting `save_embedding_layers` to `True` as embedding layers found in `target_modules`.")
wandb/run-20240411_035909-21esl9hl/files/wandb-summary.json CHANGED
@@ -1 +1 @@
- {"train_runtime": 14.0567, "train_samples_per_second": 2.846, "train_steps_per_second": 0.711, "total_flos": 28907911741440.0, "train_loss": 21.220675659179687, "train/epoch": 0.0, "train/global_step": 10, "_timestamp": 1712808008.9437401, "_runtime": 59.003005027770996, "_step": 0}
+ {"train_runtime": 14.0567, "train_samples_per_second": 2.846, "train_steps_per_second": 0.711, "total_flos": 28907911741440.0, "train_loss": 21.220675659179687, "train/epoch": 0.0, "train/global_step": 10, "_timestamp": 1712808008.9437401, "_runtime": 59.003005027770996, "_step": 0, "_wandb": {"runtime": 91}}
wandb/run-20240411_035909-21esl9hl/logs/debug-internal.log CHANGED
@@ -116,3 +116,161 @@ subprocess.TimeoutExpired: Command '['conda', 'env', 'export']' timed out after
  2024-04-11 04:00:27,786 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
  2024-04-11 04:00:32,787 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
  2024-04-11 04:00:37,788 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
119
+ 2024-04-11 04:00:40,648 DEBUG SenderThread:191 [sender.py:send():379] send: stats
120
+ 2024-04-11 04:00:42,143 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: stop_status
121
+ 2024-04-11 04:00:42,144 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: stop_status
122
+ 2024-04-11 04:00:42,184 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: internal_messages
123
+ 2024-04-11 04:00:42,200 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: pause
124
+ 2024-04-11 04:00:42,200 INFO HandlerThread:191 [handler.py:handle_request_pause():708] stopping system metrics thread
125
+ 2024-04-11 04:00:42,200 INFO HandlerThread:191 [system_monitor.py:finish():203] Stopping system monitor
126
+ 2024-04-11 04:00:42,200 DEBUG SystemMonitor:191 [system_monitor.py:_start():179] Finished system metrics aggregation loop
127
+ 2024-04-11 04:00:42,200 DEBUG SystemMonitor:191 [system_monitor.py:_start():183] Publishing last batch of metrics
128
+ 2024-04-11 04:00:42,202 INFO HandlerThread:191 [interfaces.py:finish():202] Joined cpu monitor
129
+ 2024-04-11 04:00:42,202 INFO HandlerThread:191 [interfaces.py:finish():202] Joined disk monitor
130
+ 2024-04-11 04:00:42,211 INFO HandlerThread:191 [interfaces.py:finish():202] Joined gpu monitor
131
+ 2024-04-11 04:00:42,212 INFO HandlerThread:191 [interfaces.py:finish():202] Joined memory monitor
132
+ 2024-04-11 04:00:42,212 INFO HandlerThread:191 [interfaces.py:finish():202] Joined network monitor
133
+ 2024-04-11 04:00:42,234 DEBUG SenderThread:191 [sender.py:send():379] send: stats
134
+ 2024-04-11 04:00:43,235 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
135
+ 2024-04-11 04:00:48,235 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
136
+ 2024-04-11 04:00:53,236 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
137
+ 2024-04-11 04:00:57,141 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: stop_status
138
+ 2024-04-11 04:00:57,142 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: stop_status
139
+ 2024-04-11 04:00:57,182 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: internal_messages
140
+ 2024-04-11 04:00:58,263 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
141
+ 2024-04-11 04:01:03,264 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
142
+ 2024-04-11 04:01:08,265 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
143
+ 2024-04-11 04:01:12,141 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: stop_status
144
+ 2024-04-11 04:01:12,142 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: stop_status
145
+ 2024-04-11 04:01:12,182 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: internal_messages
146
+ 2024-04-11 04:01:13,266 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
147
+ 2024-04-11 04:01:18,267 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
148
+ 2024-04-11 04:01:23,268 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
149
+ 2024-04-11 04:01:23,392 DEBUG SenderThread:191 [sender.py:send():379] send: exit
150
+ 2024-04-11 04:01:23,392 INFO SenderThread:191 [sender.py:send_exit():586] handling exit code: 0
151
+ 2024-04-11 04:01:23,392 INFO SenderThread:191 [sender.py:send_exit():588] handling runtime: 91
152
+ 2024-04-11 04:01:23,394 INFO SenderThread:191 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
153
+ 2024-04-11 04:01:23,394 INFO SenderThread:191 [sender.py:send_exit():594] send defer
154
+ 2024-04-11 04:01:23,394 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
155
+ 2024-04-11 04:01:23,394 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 0
156
+ 2024-04-11 04:01:23,395 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
157
+ 2024-04-11 04:01:23,395 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 0
158
+ 2024-04-11 04:01:23,395 INFO SenderThread:191 [sender.py:transition_state():614] send defer: 1
159
+ 2024-04-11 04:01:23,395 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
160
+ 2024-04-11 04:01:23,395 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 1
161
+ 2024-04-11 04:01:23,395 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
162
+ 2024-04-11 04:01:23,395 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 1
163
+ 2024-04-11 04:01:23,395 INFO SenderThread:191 [sender.py:transition_state():614] send defer: 2
164
+ 2024-04-11 04:01:23,395 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
165
+ 2024-04-11 04:01:23,396 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 2
166
+ 2024-04-11 04:01:23,396 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
167
+ 2024-04-11 04:01:23,396 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 2
168
+ 2024-04-11 04:01:23,396 INFO SenderThread:191 [sender.py:transition_state():614] send defer: 3
169
+ 2024-04-11 04:01:23,396 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
170
+ 2024-04-11 04:01:23,396 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 3
171
+ 2024-04-11 04:01:23,396 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
172
+ 2024-04-11 04:01:23,396 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 3
173
+ 2024-04-11 04:01:23,396 INFO SenderThread:191 [sender.py:transition_state():614] send defer: 4
174
+ 2024-04-11 04:01:23,396 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
175
+ 2024-04-11 04:01:23,397 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 4
176
+ 2024-04-11 04:01:23,397 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
177
+ 2024-04-11 04:01:23,397 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 4
178
+ 2024-04-11 04:01:23,397 INFO SenderThread:191 [sender.py:transition_state():614] send defer: 5
179
+ 2024-04-11 04:01:23,397 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
180
+ 2024-04-11 04:01:23,397 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 5
181
+ 2024-04-11 04:01:23,397 DEBUG SenderThread:191 [sender.py:send():379] send: summary
182
+ 2024-04-11 04:01:23,398 INFO SenderThread:191 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
183
+ 2024-04-11 04:01:23,398 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
184
+ 2024-04-11 04:01:23,398 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 5
185
+ 2024-04-11 04:01:23,398 INFO SenderThread:191 [sender.py:transition_state():614] send defer: 6
186
+ 2024-04-11 04:01:23,398 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
187
+ 2024-04-11 04:01:23,398 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 6
188
+ 2024-04-11 04:01:23,398 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
189
+ 2024-04-11 04:01:23,399 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 6
190
+ 2024-04-11 04:01:23,399 INFO SenderThread:191 [sender.py:transition_state():614] send defer: 7
191
+ 2024-04-11 04:01:23,399 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: status_report
192
+ 2024-04-11 04:01:23,399 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
193
+ 2024-04-11 04:01:23,399 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 7
194
+ 2024-04-11 04:01:23,399 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
195
+ 2024-04-11 04:01:23,399 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 7
196
+ 2024-04-11 04:01:23,565 INFO Thread-12 :191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/wandb-summary.json
197
+ 2024-04-11 04:01:24,392 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: poll_exit
198
+ 2024-04-11 04:01:24,961 INFO SenderThread:191 [sender.py:transition_state():614] send defer: 8
199
+ 2024-04-11 04:01:24,961 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: poll_exit
200
+ 2024-04-11 04:01:24,961 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
201
+ 2024-04-11 04:01:24,961 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 8
202
+ 2024-04-11 04:01:24,962 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
203
+ 2024-04-11 04:01:24,962 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 8
204
+ 2024-04-11 04:01:24,962 INFO SenderThread:191 [job_builder.py:build():318] Attempting to build job artifact
205
+ 2024-04-11 04:01:24,964 INFO SenderThread:191 [job_builder.py:_get_source_type():466] no source found
206
+ 2024-04-11 04:01:24,964 INFO SenderThread:191 [sender.py:transition_state():614] send defer: 9
207
+ 2024-04-11 04:01:24,964 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
208
+ 2024-04-11 04:01:24,964 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 9
209
+ 2024-04-11 04:01:24,964 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
210
+ 2024-04-11 04:01:24,964 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 9
211
+ 2024-04-11 04:01:24,964 INFO SenderThread:191 [dir_watcher.py:finish():358] shutting down directory watcher
212
+ 2024-04-11 04:01:25,393 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: poll_exit
213
+ 2024-04-11 04:01:25,566 INFO SenderThread:191 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
214
+ 2024-04-11 04:01:25,567 INFO SenderThread:191 [dir_watcher.py:finish():388] scan: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files
215
+ 2024-04-11 04:01:25,567 INFO SenderThread:191 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/config.yaml config.yaml
216
+ 2024-04-11 04:01:25,567 INFO SenderThread:191 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/requirements.txt requirements.txt
217
+ 2024-04-11 04:01:25,568 INFO SenderThread:191 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/conda-environment.yaml conda-environment.yaml
218
+ 2024-04-11 04:01:25,574 INFO SenderThread:191 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/wandb-summary.json wandb-summary.json
219
+ 2024-04-11 04:01:25,574 INFO SenderThread:191 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/wandb-metadata.json wandb-metadata.json
220
+ 2024-04-11 04:01:25,574 INFO SenderThread:191 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log output.log
221
+ 2024-04-11 04:01:25,575 INFO SenderThread:191 [sender.py:transition_state():614] send defer: 10
222
+ 2024-04-11 04:01:25,575 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: poll_exit
223
+ 2024-04-11 04:01:25,578 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
224
+ 2024-04-11 04:01:25,578 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 10
225
+ 2024-04-11 04:01:25,579 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
226
+ 2024-04-11 04:01:25,579 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 10
227
+ 2024-04-11 04:01:25,579 INFO SenderThread:191 [file_pusher.py:finish():172] shutting down file pusher
228
+ 2024-04-11 04:01:25,725 INFO wandb-upload_1:191 [upload_job.py:push():131] Uploaded file /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/requirements.txt
229
+ 2024-04-11 04:01:25,772 INFO wandb-upload_0:191 [upload_job.py:push():131] Uploaded file /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/config.yaml
230
+ 2024-04-11 04:01:25,777 INFO wandb-upload_3:191 [upload_job.py:push():131] Uploaded file /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/output.log
231
+ 2024-04-11 04:01:25,846 INFO wandb-upload_2:191 [upload_job.py:push():131] Uploaded file /kaggle/working/wandb/run-20240411_035909-21esl9hl/files/wandb-summary.json
232
+ 2024-04-11 04:01:26,046 INFO Thread-11 (_thread_body):191 [sender.py:transition_state():614] send defer: 11
233
+ 2024-04-11 04:01:26,046 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
234
+ 2024-04-11 04:01:26,047 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 11
235
+ 2024-04-11 04:01:26,047 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
236
+ 2024-04-11 04:01:26,047 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 11
237
+ 2024-04-11 04:01:26,047 INFO SenderThread:191 [file_pusher.py:join():178] waiting for file pusher
238
+ 2024-04-11 04:01:26,047 INFO SenderThread:191 [sender.py:transition_state():614] send defer: 12
239
+ 2024-04-11 04:01:26,048 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
240
+ 2024-04-11 04:01:26,048 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 12
241
+ 2024-04-11 04:01:26,048 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
242
+ 2024-04-11 04:01:26,048 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 12
243
+ 2024-04-11 04:01:26,048 INFO SenderThread:191 [file_stream.py:finish():614] file stream finish called
244
+ 2024-04-11 04:01:26,118 INFO SenderThread:191 [file_stream.py:finish():618] file stream finish is done
245
+ 2024-04-11 04:01:26,118 INFO SenderThread:191 [sender.py:transition_state():614] send defer: 13
246
+ 2024-04-11 04:01:26,118 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
247
+ 2024-04-11 04:01:26,118 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 13
248
+ 2024-04-11 04:01:26,119 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
249
+ 2024-04-11 04:01:26,119 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 13
250
+ 2024-04-11 04:01:26,119 INFO SenderThread:191 [sender.py:transition_state():614] send defer: 14
251
+ 2024-04-11 04:01:26,119 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: defer
252
+ 2024-04-11 04:01:26,119 INFO HandlerThread:191 [handler.py:handle_request_defer():172] handle defer: 14
253
+ 2024-04-11 04:01:26,120 DEBUG SenderThread:191 [sender.py:send():379] send: final
254
+ 2024-04-11 04:01:26,120 DEBUG SenderThread:191 [sender.py:send():379] send: footer
255
+ 2024-04-11 04:01:26,120 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: defer
256
+ 2024-04-11 04:01:26,120 INFO SenderThread:191 [sender.py:send_request_defer():610] handle sender defer: 14
257
+ 2024-04-11 04:01:26,121 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: poll_exit
258
+ 2024-04-11 04:01:26,121 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: poll_exit
259
+ 2024-04-11 04:01:26,122 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: poll_exit
260
+ 2024-04-11 04:01:26,122 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: poll_exit
261
+ 2024-04-11 04:01:26,123 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: server_info
262
+ 2024-04-11 04:01:26,123 DEBUG SenderThread:191 [sender.py:send_request():406] send_request: server_info
263
+ 2024-04-11 04:01:26,127 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: get_summary
264
+ 2024-04-11 04:01:26,127 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: sampled_history
265
+ 2024-04-11 04:01:26,128 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: internal_messages
266
+ 2024-04-11 04:01:26,139 INFO MainThread:191 [wandb_run.py:_footer_history_summary_info():3920] rendering history
267
+ 2024-04-11 04:01:26,139 INFO MainThread:191 [wandb_run.py:_footer_history_summary_info():3952] rendering summary
268
+ 2024-04-11 04:01:26,139 INFO MainThread:191 [wandb_run.py:_footer_sync_info():3879] logging synced files
269
+ 2024-04-11 04:01:26,140 DEBUG HandlerThread:191 [handler.py:handle_request():146] handle_request: shutdown
270
+ 2024-04-11 04:01:26,140 INFO HandlerThread:191 [handler.py:finish():866] shutting down handler
271
+ 2024-04-11 04:01:27,084 WARNING StreamThr :191 [internal.py:is_dead():414] Internal process exiting, parent pid 145 disappeared
272
+ 2024-04-11 04:01:27,084 ERROR StreamThr :191 [internal.py:wandb_internal():152] Internal process shutdown.
273
+ 2024-04-11 04:01:27,123 INFO WriterThread:191 [datastore.py:close():296] close: /kaggle/working/wandb/run-20240411_035909-21esl9hl/run-21esl9hl.wandb
274
+ 2024-04-11 04:01:27,139 INFO SenderThread:191 [sender.py:finish():1546] shutting down sender
275
+ 2024-04-11 04:01:27,139 INFO SenderThread:191 [file_pusher.py:finish():172] shutting down file pusher
276
+ 2024-04-11 04:01:27,139 INFO SenderThread:191 [file_pusher.py:join():178] waiting for file pusher
wandb/run-20240411_035909-21esl9hl/logs/debug.log CHANGED
@@ -30,3 +30,5 @@ config: {}
30
  2024-04-11 03:59:26,716 INFO MainThread:145 [wandb_run.py:_redirect():2268] Redirects installed.
31
  2024-04-11 03:59:26,717 INFO MainThread:145 [wandb_init.py:init():848] run started, returning control to user process
30
  2024-04-11 03:59:26,716 INFO MainThread:145 [wandb_run.py:_redirect():2268] Redirects installed.
31
  2024-04-11 03:59:26,717 INFO MainThread:145 [wandb_init.py:init():848] run started, returning control to user process
32
  2024-04-11 03:59:26,723 INFO MainThread:145 [wandb_run.py:_config_callback():1347] config_cb None None {'vocab_size': 250880, 'hidden_size': 1024, 'n_layer': 24, 'n_head': 16, 'layer_norm_epsilon': 1e-05, 'initializer_range': 0.02, 'use_cache': False, 'pretraining_tp': 1, 'apply_residual_connection_post_layernorm': False, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'bos_token_id': 1, 'eos_token_id': 2, 'slow_but_exact': False, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': None, 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['BloomForCausalLM'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'pad_token_id': 3, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'bigscience/bloomz-560m', 'transformers_version': '4.39.3', 'attention_softmax_in_fp32': True, 'bias_dropout_fusion': True, 'unk_token_id': 0, 'masked_softmax_fusion': True, 'model_type': 'bloom', 'n_inner': None, 'offset_alibi': 100, 'seq_length': 2048, 'skip_bias_add': True, 'skip_bias_add_qkv': False, 'quantization_config': {'quant_method': 'QuantizationMethod.BITS_AND_BYTES', '_load_in_8bit': False, '_load_in_4bit': True, 'llm_int8_threshold': 6.0, 'llm_int8_skip_modules': None, 'llm_int8_enable_fp32_cpu_offload': False, 'llm_int8_has_fp16_weight': False, 'bnb_4bit_quant_type': 'nf4', 'bnb_4bit_use_double_quant': False, 'bnb_4bit_compute_dtype': 'float16', 'bnb_4bit_quant_storage': 'uint8', 'load_in_4bit': True, 'load_in_8bit': False}, 'output_dir': '/kaggle/working/', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': False, 'do_predict': False, 'evaluation_strategy': 'no', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'learning_rate': 3e-05, 'weight_decay': 0.0001, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 0.3, 'num_train_epochs': 5, 'max_steps': 10, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/kaggle/working/runs/Apr11_03-48-59_321ddc84c049', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 20, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 1, 'save_safetensors': 
True, 'save_on_each_node': False, 'save_only_model': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': None, 'dataloader_num_workers': 8, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': '/kaggle/working/', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'paged_adamw_32bit', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['tensorboard', 'wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': True, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': True, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None}
33
+ 2024-04-11 04:00:42,199 INFO MainThread:145 [jupyter.py:save_ipynb():373] not saving jupyter notebook
34
+ 2024-04-11 04:00:42,200 INFO MainThread:145 [wandb_init.py:_pause_backend():438] pausing backend
wandb/run-20240411_035909-21esl9hl/run-21esl9hl.wandb CHANGED
Binary files a/wandb/run-20240411_035909-21esl9hl/run-21esl9hl.wandb and b/wandb/run-20240411_035909-21esl9hl/run-21esl9hl.wandb differ
 
wandb/run-20240411_040208-txpa3x4k/files/conda-environment.yaml ADDED
File without changes
wandb/run-20240411_040208-txpa3x4k/files/config.yaml ADDED
@@ -0,0 +1,701 @@
1
+ wandb_version: 1
2
+
3
+ _wandb:
4
+ desc: null
5
+ value:
6
+ python_version: 3.10.13
7
+ cli_version: 0.16.5
8
+ framework: huggingface
9
+ huggingface_version: 4.39.3
10
+ is_jupyter_run: true
11
+ is_kaggle_kernel: true
12
+ start_time: 1712808128.0
13
+ t:
14
+ 1:
15
+ - 1
16
+ - 2
17
+ - 3
18
+ - 5
19
+ - 11
20
+ - 12
21
+ - 49
22
+ - 51
23
+ - 53
24
+ - 55
25
+ - 71
26
+ - 84
27
+ - 98
28
+ - 105
29
+ 2:
30
+ - 1
31
+ - 2
32
+ - 3
33
+ - 5
34
+ - 11
35
+ - 12
36
+ - 49
37
+ - 51
38
+ - 53
39
+ - 55
40
+ - 71
41
+ - 84
42
+ - 98
43
+ - 105
44
+ 3:
45
+ - 7
46
+ - 23
47
+ 4: 3.10.13
48
+ 5: 0.16.5
49
+ 6: 4.39.3
50
+ 8:
51
+ - 1
52
+ - 2
53
+ - 5
54
+ 9:
55
+ 1: transformers_trainer
56
+ 13: linux-x86_64
57
+ m:
58
+ - 1: train/global_step
59
+ 6:
60
+ - 3
61
+ - 1: train/loss
62
+ 5: 1
63
+ 6:
64
+ - 1
65
+ - 1: train/grad_norm
66
+ 5: 1
67
+ 6:
68
+ - 1
69
+ - 1: train/learning_rate
70
+ 5: 1
71
+ 6:
72
+ - 1
73
+ - 1: train/epoch
74
+ 5: 1
75
+ 6:
76
+ - 1
77
+ vocab_size:
78
+ desc: null
79
+ value: 250880
80
+ hidden_size:
81
+ desc: null
82
+ value: 1024
83
+ n_layer:
84
+ desc: null
85
+ value: 24
86
+ n_head:
87
+ desc: null
88
+ value: 16
89
+ layer_norm_epsilon:
90
+ desc: null
91
+ value: 1.0e-05
92
+ initializer_range:
93
+ desc: null
94
+ value: 0.02
95
+ use_cache:
96
+ desc: null
97
+ value: false
98
+ pretraining_tp:
99
+ desc: null
100
+ value: 1
101
+ apply_residual_connection_post_layernorm:
102
+ desc: null
103
+ value: false
104
+ hidden_dropout:
105
+ desc: null
106
+ value: 0.0
107
+ attention_dropout:
108
+ desc: null
109
+ value: 0.0
110
+ bos_token_id:
111
+ desc: null
112
+ value: 1
113
+ eos_token_id:
114
+ desc: null
115
+ value: 2
116
+ slow_but_exact:
117
+ desc: null
118
+ value: false
119
+ return_dict:
120
+ desc: null
121
+ value: true
122
+ output_hidden_states:
123
+ desc: null
124
+ value: false
125
+ output_attentions:
126
+ desc: null
127
+ value: false
128
+ torchscript:
129
+ desc: null
130
+ value: false
131
+ torch_dtype:
132
+ desc: null
133
+ value: null
134
+ use_bfloat16:
135
+ desc: null
136
+ value: false
137
+ tf_legacy_loss:
138
+ desc: null
139
+ value: false
140
+ pruned_heads:
141
+ desc: null
142
+ value: {}
143
+ tie_word_embeddings:
144
+ desc: null
145
+ value: true
146
+ chunk_size_feed_forward:
147
+ desc: null
148
+ value: 0
149
+ is_encoder_decoder:
150
+ desc: null
151
+ value: false
152
+ is_decoder:
153
+ desc: null
154
+ value: false
155
+ cross_attention_hidden_size:
156
+ desc: null
157
+ value: null
158
+ add_cross_attention:
159
+ desc: null
160
+ value: false
161
+ tie_encoder_decoder:
162
+ desc: null
163
+ value: false
164
+ max_length:
165
+ desc: null
166
+ value: 20
167
+ min_length:
168
+ desc: null
169
+ value: 0
170
+ do_sample:
171
+ desc: null
172
+ value: false
173
+ early_stopping:
174
+ desc: null
175
+ value: false
176
+ num_beams:
177
+ desc: null
178
+ value: 1
179
+ num_beam_groups:
180
+ desc: null
181
+ value: 1
182
+ diversity_penalty:
183
+ desc: null
184
+ value: 0.0
185
+ temperature:
186
+ desc: null
187
+ value: 1.0
188
+ top_k:
189
+ desc: null
190
+ value: 50
191
+ top_p:
192
+ desc: null
193
+ value: 1.0
194
+ typical_p:
195
+ desc: null
196
+ value: 1.0
197
+ repetition_penalty:
198
+ desc: null
199
+ value: 1.0
200
+ length_penalty:
201
+ desc: null
202
+ value: 1.0
203
+ no_repeat_ngram_size:
204
+ desc: null
205
+ value: 0
206
+ encoder_no_repeat_ngram_size:
207
+ desc: null
208
+ value: 0
209
+ bad_words_ids:
210
+ desc: null
211
+ value: null
212
+ num_return_sequences:
213
+ desc: null
214
+ value: 1
215
+ output_scores:
216
+ desc: null
217
+ value: false
218
+ return_dict_in_generate:
219
+ desc: null
220
+ value: false
221
+ forced_bos_token_id:
222
+ desc: null
223
+ value: null
224
+ forced_eos_token_id:
225
+ desc: null
226
+ value: null
227
+ remove_invalid_values:
228
+ desc: null
229
+ value: false
230
+ exponential_decay_length_penalty:
231
+ desc: null
232
+ value: null
233
+ suppress_tokens:
234
+ desc: null
235
+ value: null
236
+ begin_suppress_tokens:
237
+ desc: null
238
+ value: null
239
+ architectures:
240
+ desc: null
241
+ value:
242
+ - BloomForCausalLM
243
+ finetuning_task:
244
+ desc: null
245
+ value: null
246
+ id2label:
247
+ desc: null
248
+ value:
249
+ '0': LABEL_0
250
+ '1': LABEL_1
251
+ label2id:
252
+ desc: null
253
+ value:
254
+ LABEL_0: 0
255
+ LABEL_1: 1
256
+ tokenizer_class:
257
+ desc: null
258
+ value: null
259
+ prefix:
260
+ desc: null
261
+ value: null
262
+ pad_token_id:
263
+ desc: null
264
+ value: 3
265
+ sep_token_id:
266
+ desc: null
267
+ value: null
268
+ decoder_start_token_id:
269
+ desc: null
270
+ value: null
271
+ task_specific_params:
272
+ desc: null
273
+ value: null
274
+ problem_type:
275
+ desc: null
276
+ value: null
277
+ _name_or_path:
278
+ desc: null
279
+ value: bigscience/bloomz-560m
280
+ transformers_version:
281
+ desc: null
282
+ value: 4.39.3
283
+ attention_softmax_in_fp32:
284
+ desc: null
285
+ value: true
286
+ bias_dropout_fusion:
287
+ desc: null
288
+ value: true
289
+ unk_token_id:
290
+ desc: null
291
+ value: 0
292
+ masked_softmax_fusion:
293
+ desc: null
294
+ value: true
295
+ model_type:
296
+ desc: null
297
+ value: bloom
298
+ n_inner:
299
+ desc: null
300
+ value: null
301
+ offset_alibi:
302
+ desc: null
303
+ value: 100
304
+ seq_length:
305
+ desc: null
306
+ value: 2048
307
+ skip_bias_add:
308
+ desc: null
309
+ value: true
310
+ skip_bias_add_qkv:
311
+ desc: null
312
+ value: false
313
+ quantization_config:
314
+ desc: null
315
+ value:
316
+ quant_method: QuantizationMethod.BITS_AND_BYTES
317
+ _load_in_8bit: false
318
+ _load_in_4bit: true
319
+ llm_int8_threshold: 6.0
320
+ llm_int8_skip_modules: null
321
+ llm_int8_enable_fp32_cpu_offload: false
322
+ llm_int8_has_fp16_weight: false
323
+ bnb_4bit_quant_type: nf4
324
+ bnb_4bit_use_double_quant: false
325
+ bnb_4bit_compute_dtype: float16
326
+ bnb_4bit_quant_storage: uint8
327
+ load_in_4bit: true
328
+ load_in_8bit: false
329
+ output_dir:
330
+ desc: null
331
+ value: /kaggle/working/
332
+ overwrite_output_dir:
333
+ desc: null
334
+ value: false
335
+ do_train:
336
+ desc: null
337
+ value: false
338
+ do_eval:
339
+ desc: null
340
+ value: false
341
+ do_predict:
342
+ desc: null
343
+ value: false
344
+ evaluation_strategy:
345
+ desc: null
346
+ value: 'no'
347
+ prediction_loss_only:
348
+ desc: null
349
+ value: false
350
+ per_device_train_batch_size:
351
+ desc: null
352
+ value: 8
353
+ per_device_eval_batch_size:
354
+ desc: null
355
+ value: 8
356
+ per_gpu_train_batch_size:
357
+ desc: null
358
+ value: null
359
+ per_gpu_eval_batch_size:
360
+ desc: null
361
+ value: null
362
+ gradient_accumulation_steps:
363
+ desc: null
364
+ value: 1
365
+ eval_accumulation_steps:
366
+ desc: null
367
+ value: null
368
+ eval_delay:
369
+ desc: null
370
+ value: 0
371
+ learning_rate:
372
+ desc: null
373
+ value: 3.0e-05
374
+ weight_decay:
375
+ desc: null
376
+ value: 0.001
377
+ adam_beta1:
378
+ desc: null
379
+ value: 0.9
380
+ adam_beta2:
381
+ desc: null
382
+ value: 0.999
383
+ adam_epsilon:
384
+ desc: null
385
+ value: 1.0e-08
386
+ max_grad_norm:
387
+ desc: null
388
+ value: 0.3
389
+ num_train_epochs:
390
+ desc: null
391
+ value: 5
392
+ max_steps:
393
+ desc: null
394
+ value: 7000
395
+ lr_scheduler_type:
396
+ desc: null
397
+ value: cosine
398
+ lr_scheduler_kwargs:
399
+ desc: null
400
+ value: {}
401
+ warmup_ratio:
402
+ desc: null
403
+ value: 0.03
404
+ warmup_steps:
405
+ desc: null
406
+ value: 0
407
+ log_level:
408
+ desc: null
409
+ value: passive
410
+ log_level_replica:
411
+ desc: null
412
+ value: warning
413
+ log_on_each_node:
414
+ desc: null
415
+ value: true
416
+ logging_dir:
417
+ desc: null
418
+ value: /kaggle/working/runs/Apr11_04-02-02_321ddc84c049
419
+ logging_strategy:
420
+ desc: null
421
+ value: steps
422
+ logging_first_step:
423
+ desc: null
424
+ value: false
425
+ logging_steps:
426
+ desc: null
427
+ value: 20
428
+ logging_nan_inf_filter:
429
+ desc: null
430
+ value: true
431
+ save_strategy:
432
+ desc: null
433
+ value: steps
434
+ save_steps:
435
+ desc: null
436
+ value: 20
437
+ save_total_limit:
438
+ desc: null
439
+ value: 1
440
+ save_safetensors:
441
+ desc: null
442
+ value: true
443
+ save_on_each_node:
444
+ desc: null
445
+ value: false
446
+ save_only_model:
447
+ desc: null
448
+ value: false
449
+ no_cuda:
450
+ desc: null
451
+ value: false
452
+ use_cpu:
453
+ desc: null
454
+ value: false
455
+ use_mps_device:
456
+ desc: null
457
+ value: false
458
+ seed:
459
+ desc: null
460
+ value: 42
461
+ data_seed:
462
+ desc: null
463
+ value: null
464
+ jit_mode_eval:
465
+ desc: null
466
+ value: false
467
+ use_ipex:
468
+ desc: null
469
+ value: false
470
+ bf16:
471
+ desc: null
472
+ value: false
473
+ fp16:
474
+ desc: null
475
+ value: false
476
+ fp16_opt_level:
477
+ desc: null
478
+ value: O1
479
+ half_precision_backend:
480
+ desc: null
481
+ value: auto
482
+ bf16_full_eval:
483
+ desc: null
484
+ value: false
485
+ fp16_full_eval:
486
+ desc: null
487
+ value: false
488
+ tf32:
489
+ desc: null
490
+ value: null
491
+ local_rank:
492
+ desc: null
493
+ value: 0
494
+ ddp_backend:
495
+ desc: null
496
+ value: null
497
+ tpu_num_cores:
498
+ desc: null
499
+ value: null
500
+ tpu_metrics_debug:
501
+ desc: null
502
+ value: false
503
+ debug:
504
+ desc: null
505
+ value: []
506
+ dataloader_drop_last:
507
+ desc: null
508
+ value: false
509
+ eval_steps:
510
+ desc: null
511
+ value: null
512
+ dataloader_num_workers:
513
+ desc: null
514
+ value: 8
515
+ dataloader_prefetch_factor:
516
+ desc: null
517
+ value: null
518
+ past_index:
519
+ desc: null
520
+ value: -1
521
+ run_name:
522
+ desc: null
523
+ value: /kaggle/working/
524
+ disable_tqdm:
525
+ desc: null
526
+ value: false
527
+ remove_unused_columns:
528
+ desc: null
529
+ value: true
530
+ label_names:
531
+ desc: null
532
+ value: null
533
+ load_best_model_at_end:
534
+ desc: null
535
+ value: false
536
+ metric_for_best_model:
537
+ desc: null
538
+ value: null
539
+ greater_is_better:
540
+ desc: null
541
+ value: null
542
+ ignore_data_skip:
543
+ desc: null
544
+ value: false
545
+ fsdp:
546
+ desc: null
547
+ value: []
548
+ fsdp_min_num_params:
549
+ desc: null
550
+ value: 0
551
+ fsdp_config:
552
+ desc: null
553
+ value:
554
+ min_num_params: 0
555
+ xla: false
556
+ xla_fsdp_v2: false
557
+ xla_fsdp_grad_ckpt: false
558
+ fsdp_transformer_layer_cls_to_wrap:
559
+ desc: null
560
+ value: null
561
+ accelerator_config:
562
+ desc: null
563
+ value:
564
+ split_batches: false
565
+ dispatch_batches: null
566
+ even_batches: true
567
+ use_seedable_sampler: true
568
+ deepspeed:
569
+ desc: null
570
+ value: null
571
+ label_smoothing_factor:
572
+ desc: null
573
+ value: 0.0
574
+ optim:
575
+ desc: null
576
+ value: paged_adamw_32bit
577
+ optim_args:
578
+ desc: null
579
+ value: null
580
+ adafactor:
581
+ desc: null
582
+ value: false
583
+ group_by_length:
584
+ desc: null
585
+ value: false
586
+ length_column_name:
587
+ desc: null
588
+ value: length
589
+ report_to:
590
+ desc: null
591
+ value:
592
+ - tensorboard
593
+ - wandb
594
+ ddp_find_unused_parameters:
595
+ desc: null
596
+ value: null
597
+ ddp_bucket_cap_mb:
598
+ desc: null
599
+ value: null
600
+ ddp_broadcast_buffers:
601
+ desc: null
602
+ value: null
603
+ dataloader_pin_memory:
604
+ desc: null
605
+ value: true
606
+ dataloader_persistent_workers:
607
+ desc: null
608
+ value: false
609
+ skip_memory_metrics:
610
+ desc: null
611
+ value: true
612
+ use_legacy_prediction_loop:
613
+ desc: null
614
+ value: false
615
+ push_to_hub:
616
+ desc: null
617
+ value: false
618
+ resume_from_checkpoint:
619
+ desc: null
620
+ value: null
621
+ hub_model_id:
622
+ desc: null
623
+ value: null
624
+ hub_strategy:
625
+ desc: null
626
+ value: every_save
627
+ hub_token:
628
+ desc: null
629
+ value: <HUB_TOKEN>
630
+ hub_private_repo:
631
+ desc: null
632
+ value: false
633
+ hub_always_push:
634
+ desc: null
635
+ value: false
636
+ gradient_checkpointing:
637
+ desc: null
638
+ value: true
639
+ gradient_checkpointing_kwargs:
640
+ desc: null
641
+ value: null
642
+ include_inputs_for_metrics:
643
+ desc: null
644
+ value: false
645
+ fp16_backend:
646
+ desc: null
647
+ value: auto
648
+ push_to_hub_model_id:
649
+ desc: null
650
+ value: null
651
+ push_to_hub_organization:
652
+ desc: null
653
+ value: null
654
+ push_to_hub_token:
655
+ desc: null
656
+ value: <PUSH_TO_HUB_TOKEN>
657
+ mp_parameters:
658
+ desc: null
659
+ value: ''
660
+ auto_find_batch_size:
661
+ desc: null
662
+ value: true
663
+ full_determinism:
664
+ desc: null
665
+ value: false
666
+ torchdynamo:
667
+ desc: null
668
+ value: null
669
+ ray_scope:
670
+ desc: null
671
+ value: last
672
+ ddp_timeout:
673
+ desc: null
674
+ value: 1800
675
+ torch_compile:
676
+ desc: null
677
+ value: false
678
+ torch_compile_backend:
679
+ desc: null
680
+ value: null
681
+ torch_compile_mode:
682
+ desc: null
683
+ value: null
684
+ dispatch_batches:
685
+ desc: null
686
+ value: null
687
+ split_batches:
688
+ desc: null
689
+ value: null
690
+ include_tokens_per_second:
691
+ desc: null
692
+ value: false
693
+ include_num_input_tokens_seen:
694
+ desc: null
695
+ value: false
696
+ neftune_noise_alpha:
697
+ desc: null
698
+ value: null
699
+ optim_target_modules:
700
+ desc: null
701
+ value: null
wandb/run-20240411_040208-txpa3x4k/files/output.log ADDED
@@ -0,0 +1,18 @@
1
+ /opt/conda/lib/python3.10/site-packages/torch/utils/data/dataloader.py:557: UserWarning: This DataLoader will create 8 worker processes in total. Our suggested max number of worker in current system is 4, which is smaller than what this DataLoader is going to create. Please be aware that excessive worker creation might get DataLoader running slow or even freeze, lower the worker number to avoid potential slowness/freeze if necessary.
2
+ warnings.warn(_create_warning_msg(
3
+ /opt/conda/lib/python3.10/site-packages/torch/utils/checkpoint.py:429: UserWarning: torch.utils.checkpoint: please pass in use_reentrant=True or use_reentrant=False explicitly. The default value of use_reentrant will be updated to be False in the future. To maintain current behavior, pass use_reentrant=True. It is recommended that you use use_reentrant=False. Refer to docs for more details on the differences between the two variants.
4
+ warnings.warn(
5
+ /opt/conda/lib/python3.10/site-packages/torch/nn/parallel/_functions.py:68: UserWarning: Was asked to gather along dimension 0, but all input tensors were scalars; will instead unsqueeze and return a vector.
6
+ warnings.warn('Was asked to gather along dimension 0, but all '
7
+ /opt/conda/lib/python3.10/site-packages/peft/utils/save_and_load.py:139: UserWarning: Setting `save_embedding_layers` to `True` as embedding layers found in `target_modules`.
8
+ warnings.warn("Setting `save_embedding_layers` to `True` as embedding layers found in `target_modules`.")
9
+ /opt/conda/lib/python3.10/site-packages/torch/utils/checkpoint.py:429: UserWarning: torch.utils.checkpoint: please pass in use_reentrant=True or use_reentrant=False explicitly. The default value of use_reentrant will be updated to be False in the future. To maintain current behavior, pass use_reentrant=True. It is recommended that you use use_reentrant=False. Refer to docs for more details on the differences between the two variants.
10
+ warnings.warn(
11
+ /opt/conda/lib/python3.10/site-packages/torch/nn/parallel/_functions.py:68: UserWarning: Was asked to gather along dimension 0, but all input tensors were scalars; will instead unsqueeze and return a vector.
12
+ warnings.warn('Was asked to gather along dimension 0, but all '
13
+ /opt/conda/lib/python3.10/site-packages/peft/utils/save_and_load.py:139: UserWarning: Setting `save_embedding_layers` to `True` as embedding layers found in `target_modules`.
14
+ warnings.warn("Setting `save_embedding_layers` to `True` as embedding layers found in `target_modules`.")
15
+ /opt/conda/lib/python3.10/site-packages/torch/utils/checkpoint.py:429: UserWarning: torch.utils.checkpoint: please pass in use_reentrant=True or use_reentrant=False explicitly. The default value of use_reentrant will be updated to be False in the future. To maintain current behavior, pass use_reentrant=True. It is recommended that you use use_reentrant=False. Refer to docs for more details on the differences between the two variants.
16
+ warnings.warn(
17
+ /opt/conda/lib/python3.10/site-packages/torch/nn/parallel/_functions.py:68: UserWarning: Was asked to gather along dimension 0, but all input tensors were scalars; will instead unsqueeze and return a vector.
18
+ warnings.warn('Was asked to gather along dimension 0, but all '
wandb/run-20240411_040208-txpa3x4k/files/requirements.txt ADDED
@@ -0,0 +1,864 @@
1
+ Babel==2.14.0
2
+ Boruta==0.3
3
+ Brotli==1.0.9
4
+ CVXcanon==0.1.2
5
+ Cartopy==0.22.0
6
+ Cython==3.0.8
7
+ Deprecated==1.2.14
8
+ Farama-Notifications==0.0.4
9
+ Flask==3.0.2
10
+ Geohash==1.0
11
+ GitPython==3.1.41
12
+ ImageHash==4.3.1
13
+ Janome==0.5.0
14
+ Jinja2==3.1.2
15
+ LunarCalendar==0.0.9
16
+ Mako==1.3.2
17
+ Markdown==3.5.2
18
+ MarkupSafe==2.1.3
19
+ MarkupSafe==2.1.5
20
+ Pillow==9.5.0
21
+ PuLP==2.8.0
22
+ PyArabic==0.6.15
23
+ PyJWT==2.8.0
24
+ PyMeeus==0.5.12
25
+ PySocks==1.7.1
26
+ PyUpSet==0.1.1.post7
27
+ PyWavelets==1.5.0
28
+ PyYAML==6.0.1
29
+ Pygments==2.17.2
30
+ Pympler==1.0.1
31
+ QtPy==2.4.1
32
+ Rtree==1.2.0
33
+ SQLAlchemy==2.0.25
34
+ SecretStorage==3.3.3
35
+ Send2Trash==1.8.2
36
+ Shapely==1.8.5.post1
37
+ Shimmy==1.3.0
38
+ SimpleITK==2.3.1
39
+ TPOT==0.12.1
40
+ Theano-PyMC==1.1.2
41
+ Theano==1.0.5
42
+ Wand==0.6.13
43
+ Werkzeug==3.0.2
44
+ absl-py==1.4.0
45
+ accelerate==0.28.0
46
+ access==1.1.9
47
+ affine==2.4.0
48
+ aiobotocore==2.12.2
49
+ aiofiles==22.1.0
50
+ aiohttp-cors==0.7.0
51
+ aiohttp==3.9.1
52
+ aioitertools==0.11.0
53
+ aiorwlock==1.3.0
54
+ aiosignal==1.3.1
55
+ aiosqlite==0.19.0
56
+ albumentations==1.4.0
57
+ alembic==1.13.1
58
+ altair==5.3.0
59
+ annotated-types==0.6.0
60
+ annoy==1.17.3
61
+ anyio==4.2.0
62
+ apache-beam==2.46.0
63
+ aplus==0.11.0
64
+ appdirs==1.4.4
65
+ archspec==0.2.3
66
+ argon2-cffi-bindings==21.2.0
67
+ argon2-cffi==23.1.0
68
+ array-record==0.5.0
69
+ arrow==1.3.0
70
+ arviz==0.17.1
71
+ astroid==3.1.0
72
+ astropy-iers-data==0.2024.4.1.0.33.14
73
+ astropy==6.0.1
74
+ asttokens==2.4.1
75
+ astunparse==1.6.3
76
+ async-lru==2.0.4
77
+ async-timeout==4.0.3
78
+ attrs==23.2.0
79
+ audioread==3.0.1
80
+ autopep8==2.0.4
81
+ backoff==2.2.1
82
+ bayesian-optimization==1.4.3
83
+ beatrix_jupyterlab==2023.128.151533
84
+ beautifulsoup4==4.12.2
85
+ bitsandbytes==0.43.0
86
+ blake3==0.2.1
87
+ bleach==6.1.0
88
+ blessed==1.20.0
89
+ blinker==1.7.0
90
+ blis==0.7.10
91
+ blosc2==2.6.0
92
+ bokeh==3.3.4
93
+ boltons==23.1.1
94
+ boto3==1.26.100
95
+ botocore==1.34.51
96
+ bq_helper==0.4.1
97
+ bqplot==0.12.43
98
+ branca==0.7.1
99
+ brewer2mpl==1.4.1
100
+ brotlipy==0.7.0
101
+ cached-property==1.5.2
102
+ cachetools==4.2.4
103
+ cachetools==5.3.2
104
+ catalogue==2.0.10
105
+ catalyst==22.4
106
+ catboost==1.2.3
107
+ category-encoders==2.6.3
108
+ certifi==2024.2.2
109
+ cesium==0.12.1
110
+ cffi==1.16.0
111
+ charset-normalizer==3.3.2
112
+ chex==0.1.86
113
+ cleverhans==4.0.0
114
+ click-plugins==1.1.1
115
+ click==8.1.7
116
+ cligj==0.7.2
117
+ cloud-tpu-client==0.10
118
+ cloud-tpu-profiler==2.4.0
119
+ cloudpathlib==0.16.0
120
+ cloudpickle==2.2.1
121
+ cloudpickle==3.0.0
122
+ cmdstanpy==1.2.2
123
+ colorama==0.4.6
124
+ colorcet==3.1.0
125
+ colorful==0.5.6
126
+ colorlog==6.8.2
127
+ colorlover==0.3.0
128
+ comm==0.2.1
129
+ conda-libmamba-solver==23.7.0
130
+ conda-package-handling==2.2.0
131
+ conda==23.7.4
132
+ conda_package_streaming==0.9.0
133
+ confection==0.1.4
134
+ contextily==1.6.0
135
+ contourpy==1.2.0
136
+ convertdate==2.4.0
137
+ crcmod==1.7
138
+ cryptography==41.0.7
139
+ cuda-python==12.4.0
140
+ cudf==23.8.0
141
+ cufflinks==0.17.3
142
+ cuml==23.8.0
143
+ cupy==13.0.0
144
+ cycler==0.12.1
145
+ cymem==2.0.8
146
+ cytoolz==0.12.3
147
+ daal4py==2024.2.0
148
+ daal==2024.2.0
149
+ dacite==1.8.1
150
+ dask-cuda==23.8.0
151
+ dask-cudf==23.8.0
152
+ dask-expr==1.0.9
153
+ dask==2024.4.0
154
+ dataclasses-json==0.6.4
155
+ dataproc_jupyter_plugin==0.1.66
156
+ datasets==2.16.0
157
+ datashader==0.16.0
158
+ datatile==1.0.3
159
+ db-dtypes==1.2.0
160
+ deap==1.4.1
161
+ debugpy==1.8.0
162
+ decorator==5.1.1
163
+ deepdiff==6.7.1
164
+ defusedxml==0.7.1
165
+ deprecation==2.1.0
166
+ descartes==1.1.0
167
+ dill==0.3.7
168
+ dipy==1.9.0
169
+ distlib==0.3.8
170
+ distributed==2023.7.1
171
+ distro==1.9.0
172
+ dm-tree==0.1.8
173
+ docker-pycreds==0.4.0
174
+ docker==7.0.0
175
+ docopt==0.6.2
176
+ docstring-parser==0.15
177
+ docstring-to-markdown==0.15
178
+ docutils==0.20.1
179
+ earthengine-api==0.1.395
180
+ easydict==1.13
181
+ easyocr==1.7.1
182
+ ecos==2.0.13
183
+ eli5==0.13.0
184
+ emoji==2.11.0
185
+ en-core-web-lg==3.7.1
186
+ en-core-web-sm==3.7.1
187
+ entrypoints==0.4
188
+ ephem==4.1.5
189
+ esda==2.5.1
190
+ essentia==2.1b6.dev1110
191
+ et-xmlfile==1.1.0
192
+ etils==1.6.0
193
+ exceptiongroup==1.2.0
194
+ executing==2.0.1
195
+ explainable-ai-sdk==1.3.3
196
+ fastai==2.7.14
197
+ fastapi==0.108.0
198
+ fastavro==1.9.3
199
+ fastcore==1.5.29
200
+ fastdownload==0.0.7
201
+ fasteners==0.19
202
+ fastjsonschema==2.19.1
203
+ fastprogress==1.0.3
204
+ fastrlock==0.8.2
205
+ fasttext==0.9.2
206
+ feather-format==0.4.1
207
+ featuretools==1.30.0
208
+ filelock==3.13.1
209
+ fiona==1.9.6
210
+ fitter==1.7.0
211
+ flake8==7.0.0
212
+ flashtext==2.7
213
+ flatbuffers==23.5.26
214
+ flax==0.8.2
215
+ folium==0.16.0
216
+ fonttools==4.47.0
217
+ fonttools==4.50.0
218
+ fqdn==1.5.1
219
+ frozendict==2.4.1
220
+ frozenlist==1.4.1
221
+ fsspec==2023.10.0
222
+ fsspec==2024.3.1
223
+ funcy==2.0
224
+ fury==0.10.0
225
+ future==1.0.0
226
+ fuzzywuzzy==0.18.0
227
+ gast==0.5.4
228
+ gatspy==0.3
229
+ gcsfs==2024.2.0
230
+ gensim==4.3.2
231
+ geographiclib==2.0
232
+ geojson==3.1.0
233
+ geopandas==0.14.3
234
+ geoplot==0.5.1
235
+ geopy==2.4.1
236
+ geoviews==1.11.1
237
+ ggplot==0.11.5
238
+ giddy==2.3.5
239
+ gitdb==4.0.11
240
+ google-ai-generativelanguage==0.4.0
241
+ google-api-core==2.11.1
242
+ google-api-core==2.18.0
243
+ google-api-python-client==2.125.0
244
+ google-apitools==0.5.31
245
+ google-auth-httplib2==0.2.0
246
+ google-auth-oauthlib==1.2.0
247
+ google-auth==2.26.1
248
+ google-cloud-aiplatform==0.6.0a1
249
+ google-cloud-artifact-registry==1.10.0
250
+ google-cloud-automl==1.0.1
251
+ google-cloud-bigquery==2.34.4
252
+ google-cloud-bigtable==1.7.3
253
+ google-cloud-core==2.4.1
254
+ google-cloud-datastore==2.19.0
255
+ google-cloud-dlp==3.14.0
256
+ google-cloud-jupyter-config==0.0.5
257
+ google-cloud-language==2.13.3
258
+ google-cloud-monitoring==2.18.0
259
+ google-cloud-pubsub==2.19.0
260
+ google-cloud-pubsublite==1.9.0
261
+ google-cloud-recommendations-ai==0.7.1
262
+ google-cloud-resource-manager==1.11.0
263
+ google-cloud-spanner==3.40.1
264
+ google-cloud-storage==1.44.0
265
+ google-cloud-translate==3.12.1
266
+ google-cloud-videointelligence==2.13.3
267
+ google-cloud-vision==2.8.0
268
+ google-crc32c==1.5.0
269
+ google-generativeai==0.4.1
270
+ google-pasta==0.2.0
271
+ google-resumable-media==2.7.0
272
+ googleapis-common-protos==1.62.0
273
+ gplearn==0.4.2
274
+ gpustat==1.0.0
275
+ gpxpy==1.6.2
276
+ graphviz==0.20.3
277
+ greenlet==3.0.3
278
+ grpc-google-iam-v1==0.12.7
279
+ grpcio-status==1.48.1
280
+ grpcio-status==1.48.2
281
+ grpcio==1.51.1
282
+ grpcio==1.60.0
283
+ gviz-api==1.10.0
284
+ gym-notices==0.0.8
285
+ gym==0.26.2
286
+ gymnasium==0.29.0
287
+ h11==0.14.0
288
+ h2o==3.46.0.1
289
+ h5netcdf==1.3.0
290
+ h5py==3.10.0
291
+ haversine==2.8.1
292
+ hdfs==2.7.3
293
+ hep-ml==0.7.2
294
+ hijri-converter==2.3.1
295
+ hmmlearn==0.3.2
296
+ holidays==0.24
297
+ holoviews==1.18.3
298
+ hpsklearn==0.1.0
299
+ html5lib==1.1
300
+ htmlmin==0.1.12
301
+ httpcore==1.0.5
302
+ httplib2==0.21.0
303
+ httptools==0.6.1
304
+ httpx==0.27.0
305
+ huggingface-hub==0.22.2
306
+ hunspell==0.5.5
307
+ hydra-slayer==0.5.0
308
+ hyperopt==0.2.7
309
+ hypertools==0.8.0
310
+ idna==3.6
311
+ igraph==0.11.4
312
+ imagecodecs==2024.1.1
313
+ imageio==2.33.1
314
+ imbalanced-learn==0.12.2
315
+ imgaug==0.4.0
316
+ importlib-metadata==6.11.0
317
+ importlib-metadata==7.0.1
318
+ importlib-resources==6.1.1
319
+ inequality==1.0.1
320
+ iniconfig==2.0.0
321
+ ipydatawidgets==4.3.5
322
+ ipykernel==6.28.0
323
+ ipyleaflet==0.18.2
324
+ ipympl==0.7.0
325
+ ipython-genutils==0.2.0
326
+ ipython-genutils==0.2.0
327
+ ipython-sql==0.5.0
328
+ ipython==8.20.0
329
+ ipyvolume==0.6.3
330
+ ipyvue==1.10.2
331
+ ipyvuetify==1.9.3
332
+ ipywebrtc==0.6.0
333
+ ipywidgets==7.7.1
334
+ isoduration==20.11.0
335
+ isort==5.13.2
336
+ isoweek==1.3.3
337
+ itsdangerous==2.1.2
338
+ jaraco.classes==3.3.0
339
+ jax-jumpy==1.0.0
340
+ jax==0.4.23
341
+ jaxlib==0.4.23.dev20240116
342
+ jedi==0.19.1
343
+ jeepney==0.8.0
344
+ jieba==0.42.1
345
+ jmespath==1.0.1
346
+ joblib==1.3.2
347
+ json5==0.9.14
348
+ jsonpatch==1.33
349
+ jsonpointer==2.4
350
+ jsonschema-specifications==2023.12.1
351
+ jsonschema==4.20.0
352
+ jupyter-console==6.6.3
353
+ jupyter-events==0.9.0
354
+ jupyter-http-over-ws==0.0.8
355
+ jupyter-lsp==1.5.1
356
+ jupyter-server-mathjax==0.2.6
357
+ jupyter-ydoc==0.2.5
358
+ jupyter_client==7.4.9
359
+ jupyter_client==8.6.0
360
+ jupyter_core==5.7.1
361
+ jupyter_server==2.13.0
362
+ jupyter_server_fileid==0.9.1
363
+ jupyter_server_proxy==4.1.0
364
+ jupyter_server_terminals==0.5.1
365
+ jupyter_server_ydoc==0.8.0
366
+ jupyterlab-lsp==5.1.0
367
+ jupyterlab-widgets==3.0.9
368
+ jupyterlab==4.1.5
369
+ jupyterlab_git==0.44.0
370
+ jupyterlab_pygments==0.3.0
371
+ jupyterlab_server==2.25.2
372
+ jupytext==1.16.0
373
+ kaggle-environments==1.14.3
374
+ kaggle==1.6.8
375
+ kagglehub==0.2.2
376
+ keras-cv==0.8.2
377
+ keras-nlp==0.8.2
378
+ keras-tuner==1.4.6
379
+ keras==3.1.1
380
+ kernels-mixer==0.0.7
381
+ keyring==24.3.0
382
+ keyrings.google-artifactregistry-auth==1.1.2
383
+ kfp-pipeline-spec==0.2.2
384
+ kfp-server-api==2.0.5
385
+ kfp==2.5.0
386
+ kiwisolver==1.4.5
387
+ kmapper==2.0.1
388
+ kmodes==0.12.2
389
+ korean-lunar-calendar==0.3.1
390
+ kornia==0.7.2
391
+ kornia_rs==0.1.3
392
+ kt-legacy==1.0.5
393
+ kubernetes==26.1.0
394
+ langcodes==3.3.0
395
+ langid==1.1.6
396
+ lazy_loader==0.3
397
+ learntools==0.3.4
398
+ leven==1.0.4
399
+ libclang==16.0.6
400
+ libmambapy==1.5.0
401
+ libpysal==4.9.2
402
+ librosa==0.10.1
403
+ lightgbm==4.2.0
404
+ lightning-utilities==0.11.2
405
+ lime==0.2.0.1
406
+ line-profiler==4.1.2
407
+ linkify-it-py==2.0.3
408
+ llvmlite==0.41.1
409
+ llvmlite==0.42.0
410
+ lml==0.1.0
411
+ locket==1.0.0
412
+ loguru==0.7.2
413
+ lxml==5.2.1
414
+ lz4==4.3.3
415
+ mamba==1.5.0
416
+ mapclassify==2.6.1
417
+ markdown-it-py==3.0.0
418
+ marshmallow==3.21.1
419
+ matplotlib-inline==0.1.6
420
+ matplotlib-venn==0.11.10
421
+ matplotlib==3.7.5
422
+ matplotlib==3.8.3
423
+ mccabe==0.7.0
424
+ mdit-py-plugins==0.4.0
425
+ mdurl==0.1.2
426
+ memory-profiler==0.61.0
427
+ menuinst==2.0.1
428
+ mercantile==1.2.1
429
+ mgwr==2.2.1
430
+ missingno==0.5.2
431
+ mistune==0.8.4
432
+ mizani==0.11.1
433
+ ml-dtypes==0.2.0
434
+ mlcrate==0.2.0
435
+ mlens==0.2.3
436
+ mlxtend==0.23.1
437
+ mne==1.6.1
438
+ mnist==0.2.2
439
+ momepy==0.7.0
440
+ more-itertools==10.2.0
441
+ mpld3==0.5.10
442
+ mpmath==1.3.0
443
+ msgpack==1.0.7
444
+ multidict==6.0.4
445
+ multimethod==1.10
446
+ multipledispatch==1.0.0
447
+ multiprocess==0.70.15
448
+ munkres==1.1.4
449
+ murmurhash==1.0.10
450
+ mypy-extensions==1.0.0
451
+ namex==0.0.7
452
+ nb-conda-kernels==2.3.1
453
+ nb_conda==2.2.1
454
+ nbclassic==1.0.0
455
+ nbclient==0.5.13
456
+ nbconvert==6.4.5
457
+ nbdime==3.2.0
458
+ nbformat==5.9.2
459
+ ndindex==1.8
460
+ nest-asyncio==1.5.8
461
+ networkx==3.2.1
462
+ nibabel==5.2.1
463
+ nilearn==0.10.3
464
+ ninja==1.11.1.1
465
+ nltk==3.2.4
466
+ nose==1.3.7
467
+ notebook==6.5.4
468
+ notebook==6.5.6
469
+ notebook_executor==0.2
470
+ notebook_shim==0.2.3
471
+ numba==0.58.1
472
+ numba==0.59.1
473
+ numexpr==2.10.0
474
+ numpy==1.26.4
475
+ nvidia-ml-py==11.495.46
476
+ nvtx==0.2.10
477
+ oauth2client==4.1.3
478
+ oauthlib==3.2.2
479
+ objsize==0.6.1
480
+ odfpy==1.4.1
481
+ olefile==0.47
482
+ onnx==1.16.0
483
+ opencensus-context==0.1.3
484
+ opencensus==0.11.4
485
+ opencv-contrib-python==4.9.0.80
486
+ opencv-python-headless==4.9.0.80
487
+ opencv-python==4.9.0.80
488
+ openpyxl==3.1.2
489
+ openslide-python==1.3.1
490
+ opentelemetry-api==1.22.0
491
+ opentelemetry-exporter-otlp-proto-common==1.22.0
492
+ opentelemetry-exporter-otlp-proto-grpc==1.22.0
493
+ opentelemetry-exporter-otlp-proto-http==1.22.0
494
+ opentelemetry-exporter-otlp==1.22.0
495
+ opentelemetry-proto==1.22.0
496
+ opentelemetry-sdk==1.22.0
497
+ opentelemetry-semantic-conventions==0.43b0
498
+ opt-einsum==3.3.0
499
+ optax==0.2.2
500
+ optree==0.11.0
501
+ optuna==3.6.1
502
+ orbax-checkpoint==0.5.7
503
+ ordered-set==4.1.0
504
+ orjson==3.9.10
505
+ ortools==9.4.1874
506
+ osmnx==1.9.2
507
+ overrides==7.4.0
508
+ packaging==21.3
509
+ pandas-datareader==0.10.0
510
+ pandas-profiling==3.6.6
511
+ pandas-summary==0.2.0
512
+ pandas==2.1.4
513
+ pandas==2.2.1
514
+ pandasql==0.7.3
515
+ pandocfilters==1.5.0
516
+ panel==1.3.8
517
+ papermill==2.5.0
518
+ param==2.1.0
519
+ parso==0.8.3
520
+ partd==1.4.1
521
+ path.py==12.5.0
522
+ path==16.10.0
523
+ pathos==0.3.2
524
+ pathy==0.10.3
525
+ patsy==0.5.6
526
+ pdf2image==1.17.0
527
+ peft==0.10.0
528
+ pettingzoo==1.24.0
529
+ pexpect==4.8.0
530
+ pexpect==4.9.0
531
+ phik==0.12.4
532
+ pickleshare==0.7.5
533
+ pillow==10.3.0
534
+ pip==23.3.2
535
+ pkgutil_resolve_name==1.3.10
536
+ platformdirs==4.2.0
537
+ plotly-express==0.4.1
538
+ plotly==5.18.0
539
+ plotnine==0.13.4
540
+ pluggy==1.4.0
541
+ pointpats==2.4.0
542
+ polars==0.20.18
543
+ polyglot==16.7.4
544
+ pooch==1.8.1
545
+ pox==0.3.4
546
+ ppca==0.0.4
547
+ ppft==1.7.6.8
548
+ preprocessing==0.1.13
549
+ preshed==3.0.9
550
+ prettytable==3.9.0
551
+ progressbar2==4.4.2
552
+ prometheus-client==0.19.0
553
+ promise==2.3
554
+ prompt-toolkit==3.0.42
555
+ prompt-toolkit==3.0.43
556
+ prophet==1.1.1
557
+ proto-plus==1.23.0
558
+ protobuf==3.20.3
559
+ protobuf==4.21.12
560
+ psutil==5.9.3
561
+ psutil==5.9.7
562
+ ptyprocess==0.7.0
563
+ pudb==2024.1
564
+ pure-eval==0.2.2
565
+ py-cpuinfo==9.0.0
566
+ py-spy==0.3.14
567
+ py4j==0.10.9.7
568
+ pyLDAvis==3.4.1
569
+ pyOpenSSL==23.3.0
570
+ pyaml==23.12.0
571
+ pyarrow-hotfix==0.6
572
+ pyarrow==15.0.2
573
+ pyasn1-modules==0.3.0
574
+ pyasn1==0.5.1
575
+ pybind11==2.12.0
576
+ pyclipper==1.3.0.post5
577
+ pycodestyle==2.11.1
578
+ pycosat==0.6.6
579
+ pycparser==2.21
580
+ pycryptodome==3.20.0
581
+ pyct==0.5.0
582
+ pycuda==2024.1
583
+ pydantic==2.5.3
584
+ pydantic==2.6.4
585
+ pydantic_core==2.14.6
586
+ pydantic_core==2.16.3
587
+ pydegensac==0.1.2
588
+ pydicom==2.4.4
589
+ pydocstyle==6.3.0
590
+ pydot==1.4.2
591
+ pydub==0.25.1
592
+ pyemd==1.0.0
593
+ pyerfa==2.0.1.1
594
+ pyexcel-io==0.6.6
595
+ pyexcel-ods==0.6.0
596
+ pyflakes==3.2.0
597
+ pygltflib==1.16.2
598
+ pykalman==0.9.7
599
+ pylibraft==23.8.0
600
+ pylint==3.1.0
601
+ pymc3==3.11.4
602
+ pymongo==3.13.0
603
+ pynndescent==0.5.12
604
+ pynvml==11.4.1
605
+ pynvrtc==9.2
606
+ pyparsing==3.1.1
607
+ pyparsing==3.1.2
608
+ pypdf==4.1.0
609
+ pyproj==3.6.1
610
+ pysal==24.1
611
+ pyshp==2.3.1
612
+ pytesseract==0.3.10
613
+ pytest==8.1.1
614
+ python-bidi==0.4.2
615
+ python-dateutil==2.9.0.post0
616
+ python-dotenv==1.0.0
617
+ python-json-logger==2.0.7
618
+ python-louvain==0.16
619
+ python-lsp-jsonrpc==1.1.2
620
+ python-lsp-server==1.11.0
621
+ python-slugify==8.0.4
622
+ python-utils==3.8.2
623
+ pythreejs==2.4.2
624
+ pytoolconfig==1.3.1
625
+ pytools==2024.1.1
626
+ pytorch-ignite==0.5.0.post2
627
+ pytorch-lightning==2.2.1
628
+ pytz==2023.3.post1
629
+ pytz==2024.1
630
+ pyu2f==0.1.5
631
+ pyviz_comms==3.0.2
632
+ pyzmq==24.0.1
633
+ pyzmq==25.1.2
634
+ qgrid==1.3.1
635
+ qtconsole==5.5.1
636
+ quantecon==0.7.2
637
+ qudida==0.0.4
638
+ raft-dask==23.8.0
639
+ rasterio==1.3.9
640
+ rasterstats==0.19.0
641
+ ray-cpp==2.9.0
642
+ ray==2.9.0
643
+ referencing==0.32.1
644
+ regex==2023.12.25
645
+ requests-oauthlib==1.3.1
646
+ requests-toolbelt==0.10.1
647
+ requests==2.31.0
648
+ retrying==1.3.3
649
+ retrying==1.3.4
650
+ rfc3339-validator==0.1.4
651
+ rfc3986-validator==0.1.1
652
+ rgf-python==3.12.0
653
+ rich-click==1.7.4
654
+ rich==13.7.0
655
+ rich==13.7.1
656
+ rmm==23.8.0
657
+ rope==1.13.0
658
+ rpds-py==0.16.2
659
+ rsa==4.9
660
+ ruamel-yaml-conda==0.15.100
661
+ ruamel.yaml.clib==0.2.7
662
+ ruamel.yaml==0.17.40
663
+ s2sphere==0.2.5
664
+ s3fs==2024.2.0
665
+ s3transfer==0.6.2
666
+ safetensors==0.4.2
667
+ scattertext==0.1.19
668
+ scikit-image==0.22.0
669
+ scikit-learn-intelex==2024.2.0
670
+ scikit-learn==1.2.2
671
+ scikit-multilearn==0.2.0
672
+ scikit-optimize==0.10.1
673
+ scikit-plot==0.3.7
674
+ scikit-surprise==1.1.3
675
+ scipy==1.11.4
676
+ scipy==1.12.0
677
+ seaborn==0.12.2
678
+ segment_anything==1.0
679
+ segregation==2.5
680
+ semver==3.0.2
681
+ sentencepiece==0.2.0
682
+ sentry-sdk==1.44.1
683
+ setproctitle==1.3.3
684
+ setuptools-git==1.2
685
+ setuptools-scm==8.0.4
686
+ setuptools==69.0.3
687
+ shap==0.44.1
688
+ shapely==2.0.3
689
+ shellingham==1.5.4
690
+ shtab==1.7.1
691
+ simpervisor==1.0.0
692
+ simplejson==3.19.2
693
+ six==1.16.0
694
+ sklearn-pandas==2.2.0
695
+ slicer==0.0.7
696
+ smart-open==6.4.0
697
+ smmap==5.0.1
698
+ sniffio==1.3.0
699
+ snowballstemmer==2.2.0
700
+ snuggs==1.4.7
701
+ sortedcontainers==2.4.0
702
+ soundfile==0.12.1
703
+ soupsieve==2.5
704
+ soxr==0.3.7
705
+ spacy-legacy==3.0.12
706
+ spacy-loggers==1.0.5
707
+ spacy==3.7.2
708
+ spaghetti==1.7.5.post1
709
+ spectral==0.23.1
710
+ spglm==1.1.0
711
+ sphinx-rtd-theme==0.2.4
712
+ spint==1.0.7
713
+ splot==1.1.5.post1
714
+ spopt==0.6.0
715
+ spreg==1.4.2
716
+ spvcm==0.3.0
717
+ sqlparse==0.4.4
718
+ squarify==0.4.3
719
+ srsly==2.4.8
720
+ stable-baselines3==2.1.0
721
+ stack-data==0.6.2
722
+ stack-data==0.6.3
723
+ stanio==0.5.0
724
+ starlette==0.32.0.post1
725
+ statsmodels==0.14.1
726
+ stemming==1.0.1
727
+ stop-words==2018.7.23
728
+ stopit==1.1.2
729
+ stumpy==1.12.0
730
+ sympy==1.12
731
+ tables==3.9.2
732
+ tabulate==0.9.0
733
+ tangled-up-in-unicode==0.2.0
734
+ tbb==2021.12.0
735
+ tblib==3.0.0
736
+ tenacity==8.2.3
737
+ tensorboard-data-server==0.7.2
738
+ tensorboard-plugin-profile==2.15.0
739
+ tensorboard==2.15.1
740
+ tensorboardX==2.6.2.2
741
+ tensorflow-cloud==0.1.16
742
+ tensorflow-datasets==4.9.4
743
+ tensorflow-decision-forests==1.8.1
744
+ tensorflow-estimator==2.15.0
745
+ tensorflow-hub==0.16.1
746
+ tensorflow-io-gcs-filesystem==0.35.0
747
+ tensorflow-io==0.35.0
748
+ tensorflow-metadata==0.14.0
749
+ tensorflow-probability==0.23.0
750
+ tensorflow-serving-api==2.14.1
751
+ tensorflow-text==2.15.0
752
+ tensorflow-transform==0.14.0
753
+ tensorflow==2.15.0
754
+ tensorstore==0.1.56
755
+ termcolor==2.4.0
756
+ terminado==0.18.0
757
+ testpath==0.6.0
758
+ text-unidecode==1.3
759
+ textblob==0.18.0.post0
760
+ texttable==1.7.0
761
+ tf_keras==2.15.1
762
+ tfp-nightly==0.24.0.dev0
763
+ thinc==8.2.2
764
+ threadpoolctl==3.2.0
765
+ tifffile==2023.12.9
766
+ timm==0.9.16
767
+ tinycss2==1.2.1
768
+ tobler==0.11.2
769
+ tokenizers==0.15.2
770
+ toml==0.10.2
771
+ tomli==2.0.1
772
+ tomlkit==0.12.4
773
+ toolz==0.12.1
774
+ torch==2.1.2
775
+ torchaudio==2.1.2
776
+ torchdata==0.7.1
777
+ torchinfo==1.8.0
778
+ torchmetrics==1.3.2
779
+ torchtext==0.16.2
780
+ torchvision==0.16.2
781
+ tornado==6.3.3
782
+ tqdm==4.66.1
783
+ traceml==1.0.8
784
+ traitlets==5.9.0
785
+ traittypes==0.2.1
786
+ transformers==4.39.3
787
+ treelite-runtime==3.2.0
788
+ treelite==3.2.0
789
+ trl==0.8.1
790
+ truststore==0.8.0
791
+ trx-python==0.2.9
792
+ tsfresh==0.20.2
793
+ typeguard==4.1.5
794
+ typer==0.9.0
795
+ typer==0.9.4
796
+ types-python-dateutil==2.8.19.20240106
797
+ typing-inspect==0.9.0
798
+ typing-utils==0.1.0
799
+ typing_extensions==4.9.0
800
+ tyro==0.8.3
801
+ tzdata==2023.4
802
+ uc-micro-py==1.0.3
803
+ ucx-py==0.33.0
804
+ ujson==5.9.0
805
+ umap-learn==0.5.5
806
+ unicodedata2==15.1.0
807
+ update-checker==0.18.0
808
+ uri-template==1.3.0
809
+ uritemplate==3.0.1
810
+ urllib3==1.26.18
811
+ urllib3==2.1.0
812
+ urwid==2.6.10
813
+ urwid_readline==0.14
814
+ uvicorn==0.25.0
815
+ uvloop==0.19.0
816
+ vaex-astro==0.9.3
817
+ vaex-core==4.17.1
818
+ vaex-hdf5==0.14.1
819
+ vaex-jupyter==0.8.2
820
+ vaex-ml==0.18.3
821
+ vaex-server==0.9.0
822
+ vaex-viz==0.5.4
823
+ vaex==4.17.0
824
+ vec_noise==1.1.4
825
+ vecstack==0.4.0
826
+ virtualenv==20.21.0
827
+ visions==0.7.5
828
+ vowpalwabbit==9.9.0
829
+ vtk==9.3.0
830
+ wandb==0.16.5
831
+ wasabi==1.1.2
832
+ watchfiles==0.21.0
833
+ wavio==0.0.8
834
+ wcwidth==0.2.13
835
+ weasel==0.3.4
836
+ webcolors==1.13
837
+ webencodings==0.5.1
838
+ websocket-client==1.7.0
839
+ websockets==12.0
840
+ wfdb==4.1.2
841
+ whatthepatch==1.0.5
842
+ wheel==0.42.0
843
+ widgetsnbextension==3.6.6
844
+ witwidget==1.8.1
845
+ woodwork==0.29.0
846
+ wordcloud==1.9.3
847
+ wordsegment==1.3.1
848
+ wrapt==1.14.1
849
+ xarray-einstats==0.7.0
850
+ xarray==2024.3.0
851
+ xgboost==2.0.3
852
+ xvfbwrapper==0.2.9
853
+ xxhash==3.4.1
854
+ xyzservices==2023.10.1
855
+ y-py==0.6.2
856
+ yapf==0.40.2
857
+ yarl==1.9.3
858
+ yarl==1.9.4
859
+ ydata-profiling==4.6.4
860
+ yellowbrick==1.5
861
+ ypy-websocket==0.8.4
862
+ zict==3.0.0
863
+ zipp==3.17.0
864
+ zstandard==0.22.0
wandb/run-20240411_040208-txpa3x4k/files/wandb-metadata.json ADDED
@@ -0,0 +1,66 @@
1
+ {
2
+ "os": "Linux-5.15.133+-x86_64-with-glibc2.31",
3
+ "python": "3.10.13",
4
+ "heartbeatAt": "2024-04-11T04:02:08.804959",
5
+ "startedAt": "2024-04-11T04:02:08.129415",
6
+ "docker": null,
7
+ "cuda": null,
8
+ "args": [],
9
+ "state": "running",
10
+ "program": "kaggle.ipynb",
11
+ "codePathLocal": null,
12
+ "root": "/kaggle/working",
13
+ "host": "321ddc84c049",
14
+ "username": "root",
15
+ "executable": "/opt/conda/bin/python3.10",
16
+ "cpu_count": 2,
17
+ "cpu_count_logical": 4,
18
+ "cpu_freq": {
19
+ "current": 2000.19,
20
+ "min": 0.0,
21
+ "max": 0.0
22
+ },
23
+ "cpu_freq_per_core": [
24
+ {
25
+ "current": 2000.19,
26
+ "min": 0.0,
27
+ "max": 0.0
28
+ },
29
+ {
30
+ "current": 2000.19,
31
+ "min": 0.0,
32
+ "max": 0.0
33
+ },
34
+ {
35
+ "current": 2000.19,
36
+ "min": 0.0,
37
+ "max": 0.0
38
+ },
39
+ {
40
+ "current": 2000.19,
41
+ "min": 0.0,
42
+ "max": 0.0
43
+ }
44
+ ],
45
+ "disk": {
46
+ "/": {
47
+ "total": 8062.387607574463,
48
+ "used": 5566.961982727051
49
+ }
50
+ },
51
+ "gpu": "Tesla T4",
52
+ "gpu_count": 2,
53
+ "gpu_devices": [
54
+ {
55
+ "name": "Tesla T4",
56
+ "memory_total": 16106127360
57
+ },
58
+ {
59
+ "name": "Tesla T4",
60
+ "memory_total": 16106127360
61
+ }
62
+ ],
63
+ "memory": {
64
+ "total": 31.357559204101562
65
+ }
66
+ }
wandb/run-20240411_040208-txpa3x4k/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
1
+ {"train/loss": 27.1232, "train/grad_norm": 212.8720245361328, "train/learning_rate": 5.7142857142857145e-06, "train/epoch": 0.0, "train/global_step": 40, "_timestamp": 1712808237.341076, "_runtime": 109.20561385154724, "_step": 1, "_wandb": {"runtime": 120}}
wandb/run-20240411_040208-txpa3x4k/logs/debug-internal.log ADDED
@@ -0,0 +1,273 @@
1
+ 2024-04-11 04:02:08,136 INFO StreamThr :455 [internal.py:wandb_internal():86] W&B internal server running at pid: 455, started at: 2024-04-11 04:02:08.135570
2
+ 2024-04-11 04:02:08,137 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status
3
+ 2024-04-11 04:02:08,532 INFO WriterThread:455 [datastore.py:open_for_write():87] open: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/run-txpa3x4k.wandb
4
+ 2024-04-11 04:02:08,532 DEBUG SenderThread:455 [sender.py:send():379] send: header
5
+ 2024-04-11 04:02:08,535 DEBUG SenderThread:455 [sender.py:send():379] send: run
6
+ 2024-04-11 04:02:08,682 INFO SenderThread:455 [dir_watcher.py:__init__():211] watching files in: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files
7
+ 2024-04-11 04:02:08,683 INFO SenderThread:455 [sender.py:_start_run_threads():1124] run started: txpa3x4k with start time 1712808128.135462
8
+ 2024-04-11 04:02:08,691 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: check_version
9
+ 2024-04-11 04:02:08,691 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: check_version
10
+ 2024-04-11 04:02:08,778 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: run_start
11
+ 2024-04-11 04:02:08,790 DEBUG HandlerThread:455 [system_info.py:__init__():26] System info init
12
+ 2024-04-11 04:02:08,790 DEBUG HandlerThread:455 [system_info.py:__init__():41] System info init done
13
+ 2024-04-11 04:02:08,790 INFO HandlerThread:455 [system_monitor.py:start():194] Starting system monitor
14
+ 2024-04-11 04:02:08,790 INFO SystemMonitor:455 [system_monitor.py:_start():158] Starting system asset monitoring threads
15
+ 2024-04-11 04:02:08,791 INFO SystemMonitor:455 [interfaces.py:start():190] Started cpu monitoring
16
+ 2024-04-11 04:02:08,791 INFO SystemMonitor:455 [interfaces.py:start():190] Started disk monitoring
17
+ 2024-04-11 04:02:08,792 INFO HandlerThread:455 [system_monitor.py:probe():214] Collecting system info
18
+ 2024-04-11 04:02:08,792 INFO SystemMonitor:455 [interfaces.py:start():190] Started gpu monitoring
19
+ 2024-04-11 04:02:08,793 INFO SystemMonitor:455 [interfaces.py:start():190] Started memory monitoring
20
+ 2024-04-11 04:02:08,793 INFO SystemMonitor:455 [interfaces.py:start():190] Started network monitoring
21
+ 2024-04-11 04:02:08,804 DEBUG HandlerThread:455 [system_info.py:probe():150] Probing system
22
+ 2024-04-11 04:02:08,807 DEBUG HandlerThread:455 [gitlib.py:_init_repo():56] git repository is invalid
23
+ 2024-04-11 04:02:08,807 DEBUG HandlerThread:455 [system_info.py:probe():198] Probing system done
24
+ 2024-04-11 04:02:08,807 DEBUG HandlerThread:455 [system_monitor.py:probe():223] {'os': 'Linux-5.15.133+-x86_64-with-glibc2.31', 'python': '3.10.13', 'heartbeatAt': '2024-04-11T04:02:08.804959', 'startedAt': '2024-04-11T04:02:08.129415', 'docker': None, 'cuda': None, 'args': (), 'state': 'running', 'program': 'kaggle.ipynb', 'codePathLocal': None, 'root': '/kaggle/working', 'host': '321ddc84c049', 'username': 'root', 'executable': '/opt/conda/bin/python3.10', 'cpu_count': 2, 'cpu_count_logical': 4, 'cpu_freq': {'current': 2000.19, 'min': 0.0, 'max': 0.0}, 'cpu_freq_per_core': [{'current': 2000.19, 'min': 0.0, 'max': 0.0}, {'current': 2000.19, 'min': 0.0, 'max': 0.0}, {'current': 2000.19, 'min': 0.0, 'max': 0.0}, {'current': 2000.19, 'min': 0.0, 'max': 0.0}], 'disk': {'/': {'total': 8062.387607574463, 'used': 5566.961982727051}}, 'gpu': 'Tesla T4', 'gpu_count': 2, 'gpu_devices': [{'name': 'Tesla T4', 'memory_total': 16106127360}, {'name': 'Tesla T4', 'memory_total': 16106127360}], 'memory': {'total': 31.357559204101562}}
25
+ 2024-04-11 04:02:08,807 INFO HandlerThread:455 [system_monitor.py:probe():224] Finished collecting system info
26
+ 2024-04-11 04:02:08,807 INFO HandlerThread:455 [system_monitor.py:probe():227] Publishing system info
27
+ 2024-04-11 04:02:08,807 DEBUG HandlerThread:455 [system_info.py:_save_conda():207] Saving list of conda packages installed into the current environment
28
+ 2024-04-11 04:02:09,685 INFO Thread-12 :455 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/conda-environment.yaml
29
+ 2024-04-11 04:02:23,823 ERROR HandlerThread:455 [system_info.py:_save_conda():221] Error saving conda packages: Command '['conda', 'env', 'export']' timed out after 15 seconds
30
+ Traceback (most recent call last):
31
+ File "/opt/conda/lib/python3.10/site-packages/wandb/sdk/internal/system/system_info.py", line 214, in _save_conda
32
+ subprocess.call(
33
+ File "/opt/conda/lib/python3.10/subprocess.py", line 347, in call
34
+ return p.wait(timeout=timeout)
35
+ File "/opt/conda/lib/python3.10/subprocess.py", line 1209, in wait
36
+ return self._wait(timeout=timeout)
37
+ File "/opt/conda/lib/python3.10/subprocess.py", line 1951, in _wait
38
+ raise TimeoutExpired(self.args, timeout)
39
+ subprocess.TimeoutExpired: Command '['conda', 'env', 'export']' timed out after 15 seconds
40
+ 2024-04-11 04:02:23,824 DEBUG HandlerThread:455 [system_info.py:_save_conda():222] Saving conda packages done
41
+ 2024-04-11 04:02:23,825 INFO HandlerThread:455 [system_monitor.py:probe():229] Finished publishing system info
42
+ 2024-04-11 04:02:23,830 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
43
+ 2024-04-11 04:02:23,830 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: keepalive
44
+ 2024-04-11 04:02:23,830 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
45
+ 2024-04-11 04:02:23,830 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: keepalive
46
+ 2024-04-11 04:02:23,830 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
47
+ 2024-04-11 04:02:23,830 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: keepalive
48
+ 2024-04-11 04:02:23,831 DEBUG SenderThread:455 [sender.py:send():379] send: files
49
+ 2024-04-11 04:02:23,831 INFO SenderThread:455 [sender.py:_save_file():1390] saving file wandb-metadata.json with policy now
50
+ 2024-04-11 04:02:24,033 INFO wandb-upload_0:455 [upload_job.py:push():131] Uploaded file /tmp/tmp1s3x48hcwandb/4qm5hpvk-wandb-metadata.json
51
+ 2024-04-11 04:02:24,688 INFO Thread-12 :455 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/wandb-metadata.json
52
+ 2024-04-11 04:02:24,755 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: python_packages
53
+ 2024-04-11 04:02:24,756 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: python_packages
54
+ 2024-04-11 04:02:24,757 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: stop_status
55
+ 2024-04-11 04:02:24,758 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: stop_status
56
+ 2024-04-11 04:02:24,795 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: internal_messages
57
+ 2024-04-11 04:02:24,805 DEBUG SenderThread:455 [sender.py:send():379] send: telemetry
58
+ 2024-04-11 04:02:24,805 DEBUG SenderThread:455 [sender.py:send():379] send: config
59
+ 2024-04-11 04:02:24,807 DEBUG SenderThread:455 [sender.py:send():379] send: metric
60
+ 2024-04-11 04:02:24,808 DEBUG SenderThread:455 [sender.py:send():379] send: telemetry
61
+ 2024-04-11 04:02:24,808 DEBUG SenderThread:455 [sender.py:send():379] send: metric
62
+ 2024-04-11 04:02:24,808 WARNING SenderThread:455 [sender.py:send_metric():1341] Seen metric with glob (shouldn't happen)
63
+ 2024-04-11 04:02:24,808 DEBUG SenderThread:455 [sender.py:send():379] send: telemetry
64
+ 2024-04-11 04:02:25,688 INFO Thread-12 :455 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/output.log
65
+ 2024-04-11 04:02:25,689 INFO Thread-12 :455 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/requirements.txt
66
+ 2024-04-11 04:02:27,689 INFO Thread-12 :455 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/output.log
67
+ 2024-04-11 04:02:29,171 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
68
+ 2024-04-11 04:02:29,690 INFO Thread-12 :455 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/output.log
69
+ 2024-04-11 04:02:34,172 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
70
+ 2024-04-11 04:02:39,178 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
71
+ 2024-04-11 04:02:39,693 INFO Thread-12 :455 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/config.yaml
72
+ 2024-04-11 04:02:40,355 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: stop_status
73
+ 2024-04-11 04:02:40,355 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: stop_status
74
+ 2024-04-11 04:02:40,358 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: internal_messages
75
+ 2024-04-11 04:02:44,408 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
76
+ 2024-04-11 04:02:49,409 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
77
+ 2024-04-11 04:02:54,410 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
78
+ 2024-04-11 04:02:55,351 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: stop_status
79
+ 2024-04-11 04:02:55,352 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: stop_status
80
+ 2024-04-11 04:02:55,392 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: internal_messages
81
+ 2024-04-11 04:03:00,394 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
82
+ 2024-04-11 04:03:05,395 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
83
+ 2024-04-11 04:03:08,794 DEBUG SystemMonitor:455 [system_monitor.py:_start():172] Starting system metrics aggregation loop
84
+ 2024-04-11 04:03:08,795 DEBUG SenderThread:455 [sender.py:send():379] send: stats
85
+ 2024-04-11 04:03:10,353 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: stop_status
86
+ 2024-04-11 04:03:10,353 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: stop_status
87
+ 2024-04-11 04:03:10,394 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: internal_messages
88
+ 2024-04-11 04:03:10,420 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
89
+ 2024-04-11 04:03:12,619 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: partial_history
90
+ 2024-04-11 04:03:12,622 DEBUG SenderThread:455 [sender.py:send():379] send: metric
91
+ 2024-04-11 04:03:12,623 DEBUG SenderThread:455 [sender.py:send():379] send: metric
92
+ 2024-04-11 04:03:12,623 DEBUG SenderThread:455 [sender.py:send():379] send: metric
93
+ 2024-04-11 04:03:12,623 DEBUG SenderThread:455 [sender.py:send():379] send: metric
94
+ 2024-04-11 04:03:12,623 DEBUG SenderThread:455 [sender.py:send():379] send: history
95
+ 2024-04-11 04:03:12,623 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: summary_record
96
+ 2024-04-11 04:03:12,623 INFO SenderThread:455 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
97
+ 2024-04-11 04:03:12,709 INFO Thread-12 :455 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/wandb-summary.json
98
+ 2024-04-11 04:03:15,592 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
99
+ 2024-04-11 04:03:15,710 INFO Thread-12 :455 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/output.log
100
+ 2024-04-11 04:03:17,711 INFO Thread-12 :455 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/output.log
101
+ 2024-04-11 04:03:20,730 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
102
+ 2024-04-11 04:03:25,368 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: stop_status
103
+ 2024-04-11 04:03:25,368 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: stop_status
104
+ 2024-04-11 04:03:25,409 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: internal_messages
105
+ 2024-04-11 04:03:26,469 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
106
+ 2024-04-11 04:03:31,470 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
107
+ 2024-04-11 04:03:36,471 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
108
+ 2024-04-11 04:03:38,796 DEBUG SenderThread:455 [sender.py:send():379] send: stats
109
+ 2024-04-11 04:03:40,358 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: internal_messages
110
+ 2024-04-11 04:03:40,358 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: stop_status
111
+ 2024-04-11 04:03:40,359 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: stop_status
112
+ 2024-04-11 04:03:42,393 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
113
+ 2024-04-11 04:03:42,721 INFO Thread-12 :455 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/config.yaml
114
+ 2024-04-11 04:03:47,526 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
115
+ 2024-04-11 04:03:52,527 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
116
+ 2024-04-11 04:03:55,357 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: internal_messages
117
+ 2024-04-11 04:03:55,358 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: stop_status
118
+ 2024-04-11 04:03:55,359 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: stop_status
119
+ 2024-04-11 04:03:57,341 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: partial_history
120
+ 2024-04-11 04:03:57,342 DEBUG SenderThread:455 [sender.py:send():379] send: history
121
+ 2024-04-11 04:03:57,343 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: summary_record
122
+ 2024-04-11 04:03:57,345 INFO SenderThread:455 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
123
+ 2024-04-11 04:03:57,727 INFO Thread-12 :455 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/wandb-summary.json
124
+ 2024-04-11 04:03:58,374 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
125
+ 2024-04-11 04:03:59,728 INFO Thread-12 :455 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/output.log
126
+ 2024-04-11 04:04:01,729 INFO Thread-12 :455 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/output.log
127
+ 2024-04-11 04:04:03,528 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
128
+ 2024-04-11 04:04:03,729 INFO Thread-12 :455 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/output.log
129
+ 2024-04-11 04:04:08,529 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
130
+ 2024-04-11 04:04:08,797 DEBUG SenderThread:455 [sender.py:send():379] send: stats
131
+ 2024-04-11 04:04:09,554 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: pause
132
+ 2024-04-11 04:04:09,554 INFO HandlerThread:455 [handler.py:handle_request_pause():708] stopping system metrics thread
133
+ 2024-04-11 04:04:09,554 INFO HandlerThread:455 [system_monitor.py:finish():203] Stopping system monitor
134
+ 2024-04-11 04:04:09,554 DEBUG SystemMonitor:455 [system_monitor.py:_start():179] Finished system metrics aggregation loop
135
+ 2024-04-11 04:04:09,554 DEBUG SystemMonitor:455 [system_monitor.py:_start():183] Publishing last batch of metrics
136
+ 2024-04-11 04:04:09,555 INFO HandlerThread:455 [interfaces.py:finish():202] Joined cpu monitor
137
+ 2024-04-11 04:04:09,555 INFO HandlerThread:455 [interfaces.py:finish():202] Joined disk monitor
138
+ 2024-04-11 04:04:09,567 INFO HandlerThread:455 [interfaces.py:finish():202] Joined gpu monitor
139
+ 2024-04-11 04:04:09,567 INFO HandlerThread:455 [interfaces.py:finish():202] Joined memory monitor
140
+ 2024-04-11 04:04:09,567 INFO HandlerThread:455 [interfaces.py:finish():202] Joined network monitor
141
+ 2024-04-11 04:04:09,568 DEBUG SenderThread:455 [sender.py:send():379] send: stats
142
+ 2024-04-11 04:04:10,358 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: internal_messages
143
+ 2024-04-11 04:04:10,358 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: stop_status
144
+ 2024-04-11 04:04:10,359 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: stop_status
145
+ 2024-04-11 04:04:14,201 DEBUG SenderThread:455 [sender.py:send():379] send: exit
146
+ 2024-04-11 04:04:14,201 INFO SenderThread:455 [sender.py:send_exit():586] handling exit code: 0
147
+ 2024-04-11 04:04:14,201 INFO SenderThread:455 [sender.py:send_exit():588] handling runtime: 120
148
+ 2024-04-11 04:04:14,201 INFO SenderThread:455 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
149
+ 2024-04-11 04:04:14,202 INFO SenderThread:455 [sender.py:send_exit():594] send defer
150
+ 2024-04-11 04:04:14,202 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
151
+ 2024-04-11 04:04:14,202 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 0
152
+ 2024-04-11 04:04:14,202 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
153
+ 2024-04-11 04:04:14,202 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
154
+ 2024-04-11 04:04:14,202 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 0
155
+ 2024-04-11 04:04:14,202 INFO SenderThread:455 [sender.py:transition_state():614] send defer: 1
156
+ 2024-04-11 04:04:14,203 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
157
+ 2024-04-11 04:04:14,203 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 1
158
+ 2024-04-11 04:04:14,203 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
159
+ 2024-04-11 04:04:14,203 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 1
160
+ 2024-04-11 04:04:14,203 INFO SenderThread:455 [sender.py:transition_state():614] send defer: 2
161
+ 2024-04-11 04:04:14,203 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
162
+ 2024-04-11 04:04:14,203 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 2
163
+ 2024-04-11 04:04:14,203 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
164
+ 2024-04-11 04:04:14,204 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 2
165
+ 2024-04-11 04:04:14,204 INFO SenderThread:455 [sender.py:transition_state():614] send defer: 3
166
+ 2024-04-11 04:04:14,204 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
167
+ 2024-04-11 04:04:14,204 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 3
168
+ 2024-04-11 04:04:14,204 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
169
+ 2024-04-11 04:04:14,204 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 3
170
+ 2024-04-11 04:04:14,204 INFO SenderThread:455 [sender.py:transition_state():614] send defer: 4
171
+ 2024-04-11 04:04:14,204 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
172
+ 2024-04-11 04:04:14,204 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 4
173
+ 2024-04-11 04:04:14,204 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
174
+ 2024-04-11 04:04:14,205 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 4
175
+ 2024-04-11 04:04:14,205 INFO SenderThread:455 [sender.py:transition_state():614] send defer: 5
176
+ 2024-04-11 04:04:14,205 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
177
+ 2024-04-11 04:04:14,205 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 5
178
+ 2024-04-11 04:04:14,205 DEBUG SenderThread:455 [sender.py:send():379] send: summary
179
+ 2024-04-11 04:04:14,206 INFO SenderThread:455 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
180
+ 2024-04-11 04:04:14,206 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
181
+ 2024-04-11 04:04:14,206 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 5
182
+ 2024-04-11 04:04:14,206 INFO SenderThread:455 [sender.py:transition_state():614] send defer: 6
183
+ 2024-04-11 04:04:14,206 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
184
+ 2024-04-11 04:04:14,206 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 6
185
+ 2024-04-11 04:04:14,206 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
186
+ 2024-04-11 04:04:14,206 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 6
187
+ 2024-04-11 04:04:14,206 INFO SenderThread:455 [sender.py:transition_state():614] send defer: 7
188
+ 2024-04-11 04:04:14,207 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: status_report
189
+ 2024-04-11 04:04:14,207 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
190
+ 2024-04-11 04:04:14,207 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 7
191
+ 2024-04-11 04:04:14,207 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
192
+ 2024-04-11 04:04:14,207 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 7
193
+ 2024-04-11 04:04:14,733 INFO Thread-12 :455 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/wandb-summary.json
194
+ 2024-04-11 04:04:14,942 INFO SenderThread:455 [sender.py:transition_state():614] send defer: 8
195
+ 2024-04-11 04:04:14,942 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
196
+ 2024-04-11 04:04:14,943 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 8
197
+ 2024-04-11 04:04:14,943 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
198
+ 2024-04-11 04:04:14,943 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 8
199
+ 2024-04-11 04:04:14,943 INFO SenderThread:455 [job_builder.py:build():318] Attempting to build job artifact
200
+ 2024-04-11 04:04:14,945 INFO SenderThread:455 [job_builder.py:_get_source_type():466] no source found
201
+ 2024-04-11 04:04:14,945 INFO SenderThread:455 [sender.py:transition_state():614] send defer: 9
202
+ 2024-04-11 04:04:14,945 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
203
+ 2024-04-11 04:04:14,945 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 9
204
+ 2024-04-11 04:04:14,945 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
205
+ 2024-04-11 04:04:14,946 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 9
206
+ 2024-04-11 04:04:14,946 INFO SenderThread:455 [dir_watcher.py:finish():358] shutting down directory watcher
207
+ 2024-04-11 04:04:15,201 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: poll_exit
208
+ 2024-04-11 04:04:15,734 INFO Thread-12 :455 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/output.log
209
+ 2024-04-11 04:04:15,735 INFO SenderThread:455 [dir_watcher.py:finish():388] scan: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files
210
+ 2024-04-11 04:04:15,735 INFO SenderThread:455 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/config.yaml config.yaml
211
+ 2024-04-11 04:04:15,735 INFO SenderThread:455 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/requirements.txt requirements.txt
212
+ 2024-04-11 04:04:15,738 INFO SenderThread:455 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/conda-environment.yaml conda-environment.yaml
213
+ 2024-04-11 04:04:15,739 INFO SenderThread:455 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/wandb-summary.json wandb-summary.json
214
+ 2024-04-11 04:04:15,739 INFO SenderThread:455 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/wandb-metadata.json wandb-metadata.json
215
+ 2024-04-11 04:04:15,739 INFO SenderThread:455 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/output.log output.log
216
+ 2024-04-11 04:04:15,742 INFO SenderThread:455 [sender.py:transition_state():614] send defer: 10
217
+ 2024-04-11 04:04:15,742 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: poll_exit
218
+ 2024-04-11 04:04:15,743 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
219
+ 2024-04-11 04:04:15,743 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 10
220
+ 2024-04-11 04:04:15,749 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
221
+ 2024-04-11 04:04:15,749 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 10
222
+ 2024-04-11 04:04:15,749 INFO SenderThread:455 [file_pusher.py:finish():172] shutting down file pusher
223
+ 2024-04-11 04:04:15,892 INFO wandb-upload_0:455 [upload_job.py:push():131] Uploaded file /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/config.yaml
224
+ 2024-04-11 04:04:15,944 INFO wandb-upload_1:455 [upload_job.py:push():131] Uploaded file /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/requirements.txt
225
+ 2024-04-11 04:04:15,965 INFO wandb-upload_3:455 [upload_job.py:push():131] Uploaded file /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/output.log
226
+ 2024-04-11 04:04:15,966 INFO wandb-upload_2:455 [upload_job.py:push():131] Uploaded file /kaggle/working/wandb/run-20240411_040208-txpa3x4k/files/wandb-summary.json
227
+ 2024-04-11 04:04:16,167 INFO Thread-11 (_thread_body):455 [sender.py:transition_state():614] send defer: 11
228
+ 2024-04-11 04:04:16,167 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
229
+ 2024-04-11 04:04:16,168 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 11
230
+ 2024-04-11 04:04:16,168 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
231
+ 2024-04-11 04:04:16,168 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 11
232
+ 2024-04-11 04:04:16,168 INFO SenderThread:455 [file_pusher.py:join():178] waiting for file pusher
233
+ 2024-04-11 04:04:16,169 INFO SenderThread:455 [sender.py:transition_state():614] send defer: 12
234
+ 2024-04-11 04:04:16,169 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
235
+ 2024-04-11 04:04:16,169 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 12
236
+ 2024-04-11 04:04:16,169 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
237
+ 2024-04-11 04:04:16,169 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 12
238
+ 2024-04-11 04:04:16,169 INFO SenderThread:455 [file_stream.py:finish():614] file stream finish called
239
+ 2024-04-11 04:04:16,202 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: poll_exit
240
+ 2024-04-11 04:04:16,257 INFO SenderThread:455 [file_stream.py:finish():618] file stream finish is done
241
+ 2024-04-11 04:04:16,257 INFO SenderThread:455 [sender.py:transition_state():614] send defer: 13
242
+ 2024-04-11 04:04:16,257 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: poll_exit
243
+ 2024-04-11 04:04:16,258 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
244
+ 2024-04-11 04:04:16,258 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 13
245
+ 2024-04-11 04:04:16,258 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
246
+ 2024-04-11 04:04:16,258 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 13
247
+ 2024-04-11 04:04:16,258 INFO SenderThread:455 [sender.py:transition_state():614] send defer: 14
248
+ 2024-04-11 04:04:16,258 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: defer
249
+ 2024-04-11 04:04:16,259 INFO HandlerThread:455 [handler.py:handle_request_defer():172] handle defer: 14
250
+ 2024-04-11 04:04:16,259 DEBUG SenderThread:455 [sender.py:send():379] send: final
251
+ 2024-04-11 04:04:16,259 DEBUG SenderThread:455 [sender.py:send():379] send: footer
252
+ 2024-04-11 04:04:16,259 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: defer
253
+ 2024-04-11 04:04:16,259 INFO SenderThread:455 [sender.py:send_request_defer():610] handle sender defer: 14
254
+ 2024-04-11 04:04:16,260 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: poll_exit
255
+ 2024-04-11 04:04:16,260 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: poll_exit
256
+ 2024-04-11 04:04:16,261 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: poll_exit
257
+ 2024-04-11 04:04:16,261 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: poll_exit
258
+ 2024-04-11 04:04:16,262 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: server_info
259
+ 2024-04-11 04:04:16,262 DEBUG SenderThread:455 [sender.py:send_request():406] send_request: server_info
260
+ 2024-04-11 04:04:16,265 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: get_summary
261
+ 2024-04-11 04:04:16,266 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: sampled_history
262
+ 2024-04-11 04:04:16,267 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: internal_messages
263
+ 2024-04-11 04:04:16,277 INFO MainThread:455 [wandb_run.py:_footer_history_summary_info():3920] rendering history
264
+ 2024-04-11 04:04:16,277 INFO MainThread:455 [wandb_run.py:_footer_history_summary_info():3952] rendering summary
265
+ 2024-04-11 04:04:16,278 INFO MainThread:455 [wandb_run.py:_footer_sync_info():3879] logging synced files
266
+ 2024-04-11 04:04:16,278 DEBUG HandlerThread:455 [handler.py:handle_request():146] handle_request: shutdown
267
+ 2024-04-11 04:04:16,278 INFO HandlerThread:455 [handler.py:finish():866] shutting down handler
268
+ 2024-04-11 04:04:17,262 INFO WriterThread:455 [datastore.py:close():296] close: /kaggle/working/wandb/run-20240411_040208-txpa3x4k/run-txpa3x4k.wandb
269
+ 2024-04-11 04:04:17,267 WARNING StreamThr :455 [internal.py:is_dead():414] Internal process exiting, parent pid 414 disappeared
270
+ 2024-04-11 04:04:17,268 ERROR StreamThr :455 [internal.py:wandb_internal():152] Internal process shutdown.
271
+ 2024-04-11 04:04:17,277 INFO SenderThread:455 [sender.py:finish():1546] shutting down sender
272
+ 2024-04-11 04:04:17,277 INFO SenderThread:455 [file_pusher.py:finish():172] shutting down file pusher
273
+ 2024-04-11 04:04:17,277 INFO SenderThread:455 [file_pusher.py:join():178] waiting for file pusher
wandb/run-20240411_040208-txpa3x4k/logs/debug.log ADDED
@@ -0,0 +1,33 @@
1
+ 2024-04-11 04:02:08,131 INFO MainThread:414 [wandb_setup.py:_flush():76] Current SDK version is 0.16.5
2
+ 2024-04-11 04:02:08,131 INFO MainThread:414 [wandb_setup.py:_flush():76] Configure stats pid to 414
3
+ 2024-04-11 04:02:08,131 INFO MainThread:414 [wandb_setup.py:_flush():76] Loading settings from /root/.config/wandb/settings
4
+ 2024-04-11 04:02:08,131 INFO MainThread:414 [wandb_setup.py:_flush():76] Loading settings from /kaggle/working/wandb/settings
5
+ 2024-04-11 04:02:08,131 INFO MainThread:414 [wandb_setup.py:_flush():76] Loading settings from environment variables: {}
6
+ 2024-04-11 04:02:08,131 INFO MainThread:414 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
7
+ 2024-04-11 04:02:08,131 INFO MainThread:414 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program': '<python with no main file>'}
8
+ 2024-04-11 04:02:08,131 INFO MainThread:414 [wandb_setup.py:_flush():76] Applying login settings: {}
9
+ 2024-04-11 04:02:08,131 INFO MainThread:414 [wandb_init.py:_log_setup():527] Logging user logs to /kaggle/working/wandb/run-20240411_040208-txpa3x4k/logs/debug.log
10
+ 2024-04-11 04:02:08,131 INFO MainThread:414 [wandb_init.py:_log_setup():528] Logging internal logs to /kaggle/working/wandb/run-20240411_040208-txpa3x4k/logs/debug-internal.log
11
+ 2024-04-11 04:02:08,131 INFO MainThread:414 [wandb_init.py:_jupyter_setup():473] configuring jupyter hooks <wandb.sdk.wandb_init._WandbInit object at 0x79289283df90>
12
+ 2024-04-11 04:02:08,132 INFO MainThread:414 [wandb_init.py:init():567] calling init triggers
13
+ 2024-04-11 04:02:08,132 INFO MainThread:414 [wandb_init.py:init():574] wandb.init called with sweep_config: {}
14
+ config: {}
15
+ 2024-04-11 04:02:08,132 INFO MainThread:414 [wandb_init.py:init():617] starting backend
16
+ 2024-04-11 04:02:08,132 INFO MainThread:414 [wandb_init.py:init():621] setting up manager
17
+ 2024-04-11 04:02:08,134 INFO MainThread:414 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
18
+ 2024-04-11 04:02:08,135 INFO MainThread:414 [wandb_init.py:init():629] backend started and connected
19
+ 2024-04-11 04:02:08,148 INFO MainThread:414 [wandb_run.py:_label_probe_notebook():1299] probe notebook
20
+ 2024-04-11 04:02:08,531 INFO MainThread:414 [wandb_init.py:init():721] updated telemetry
21
+ 2024-04-11 04:02:08,534 INFO MainThread:414 [wandb_init.py:init():754] communicating run to backend with 90.0 second timeout
22
+ 2024-04-11 04:02:08,691 INFO MainThread:414 [wandb_run.py:_on_init():2344] communicating current version
23
+ 2024-04-11 04:02:08,772 INFO MainThread:414 [wandb_run.py:_on_init():2353] got version response upgrade_message: "wandb version 0.16.6 is available! To upgrade, please run:\n $ pip install wandb --upgrade"
24
+
25
+ 2024-04-11 04:02:08,772 INFO MainThread:414 [wandb_init.py:init():805] starting run threads in backend
26
+ 2024-04-11 04:02:24,756 INFO MainThread:414 [wandb_run.py:_console_start():2323] atexit reg
27
+ 2024-04-11 04:02:24,757 INFO MainThread:414 [wandb_run.py:_redirect():2178] redirect: wrap_raw
28
+ 2024-04-11 04:02:24,757 INFO MainThread:414 [wandb_run.py:_redirect():2243] Wrapping output streams.
29
+ 2024-04-11 04:02:24,758 INFO MainThread:414 [wandb_run.py:_redirect():2268] Redirects installed.
30
+ 2024-04-11 04:02:24,759 INFO MainThread:414 [wandb_init.py:init():848] run started, returning control to user process
31
+ 2024-04-11 04:02:24,765 INFO MainThread:414 [wandb_run.py:_config_callback():1347] config_cb None None {'vocab_size': 250880, 'hidden_size': 1024, 'n_layer': 24, 'n_head': 16, 'layer_norm_epsilon': 1e-05, 'initializer_range': 0.02, 'use_cache': False, 'pretraining_tp': 1, 'apply_residual_connection_post_layernorm': False, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'bos_token_id': 1, 'eos_token_id': 2, 'slow_but_exact': False, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': None, 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['BloomForCausalLM'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'pad_token_id': 3, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'bigscience/bloomz-560m', 'transformers_version': '4.39.3', 'attention_softmax_in_fp32': True, 'bias_dropout_fusion': True, 'unk_token_id': 0, 'masked_softmax_fusion': True, 'model_type': 'bloom', 'n_inner': None, 'offset_alibi': 100, 'seq_length': 2048, 'skip_bias_add': True, 'skip_bias_add_qkv': False, 'quantization_config': {'quant_method': 'QuantizationMethod.BITS_AND_BYTES', '_load_in_8bit': False, '_load_in_4bit': True, 'llm_int8_threshold': 6.0, 'llm_int8_skip_modules': None, 'llm_int8_enable_fp32_cpu_offload': False, 'llm_int8_has_fp16_weight': False, 'bnb_4bit_quant_type': 'nf4', 'bnb_4bit_use_double_quant': False, 'bnb_4bit_compute_dtype': 'float16', 'bnb_4bit_quant_storage': 'uint8', 'load_in_4bit': True, 'load_in_8bit': False}, 'output_dir': '/kaggle/working/', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': False, 'do_predict': False, 'evaluation_strategy': 'no', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'learning_rate': 3e-05, 'weight_decay': 0.001, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 0.3, 'num_train_epochs': 5, 'max_steps': 7000, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/kaggle/working/runs/Apr11_04-02-02_321ddc84c049', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 20, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 1, 'save_safetensors': 
True, 'save_on_each_node': False, 'save_only_model': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': None, 'dataloader_num_workers': 8, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': '/kaggle/working/', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'paged_adamw_32bit', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['tensorboard', 'wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': True, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': True, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None}
32
+ 2024-04-11 04:04:09,553 INFO MainThread:414 [jupyter.py:save_ipynb():373] not saving jupyter notebook
33
+ 2024-04-11 04:04:09,553 INFO MainThread:414 [wandb_init.py:_pause_backend():438] pausing backend
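Note on the config_cb dump above: as a quick orientation, the sketch below reconstructs the setup those logged values imply (bigscience/bloomz-560m loaded in 4-bit NF4 via bitsandbytes, paged 32-bit AdamW, cosine schedule with 3% warmup, step-based logging and checkpointing). It is assembled from the logged config only; it is not the repository's actual training script, and the variable names are hypothetical.

# Illustrative sketch based on the config_cb values logged above (assumptions flagged inline).
import torch
from transformers import AutoModelForCausalLM, BitsAndBytesConfig, TrainingArguments

bnb_config = BitsAndBytesConfig(
    load_in_4bit=True,                      # '_load_in_4bit': True
    bnb_4bit_quant_type="nf4",              # 'bnb_4bit_quant_type': 'nf4'
    bnb_4bit_compute_dtype=torch.float16,   # 'bnb_4bit_compute_dtype': 'float16'
    bnb_4bit_use_double_quant=False,
)

model = AutoModelForCausalLM.from_pretrained(
    "bigscience/bloomz-560m",               # '_name_or_path' in the logged config
    quantization_config=bnb_config,
    device_map="auto",                      # assumption: device placement is not recorded in the log
)

args = TrainingArguments(
    output_dir="/kaggle/working/",
    per_device_train_batch_size=8,
    learning_rate=3e-5,
    weight_decay=0.001,
    max_grad_norm=0.3,
    num_train_epochs=5,
    max_steps=7000,                         # this first run logs max_steps 7000
    lr_scheduler_type="cosine",
    warmup_ratio=0.03,
    logging_steps=20,
    save_steps=20,
    save_total_limit=1,
    optim="paged_adamw_32bit",
    gradient_checkpointing=True,
    report_to=["tensorboard", "wandb"],
)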
wandb/run-20240411_040208-txpa3x4k/run-txpa3x4k.wandb ADDED
Binary file (15 kB). View file
wandb/run-20240411_040455-4dprer7c/files/conda-environment.yaml ADDED
File without changes
wandb/run-20240411_040455-4dprer7c/files/config.yaml ADDED
@@ -0,0 +1,701 @@
1
+ wandb_version: 1
2
+
3
+ _wandb:
4
+ desc: null
5
+ value:
6
+ python_version: 3.10.13
7
+ cli_version: 0.16.5
8
+ framework: huggingface
9
+ huggingface_version: 4.39.3
10
+ is_jupyter_run: true
11
+ is_kaggle_kernel: true
12
+ start_time: 1712808295.0
13
+ t:
14
+ 1:
15
+ - 1
16
+ - 2
17
+ - 3
18
+ - 5
19
+ - 11
20
+ - 12
21
+ - 49
22
+ - 51
23
+ - 53
24
+ - 55
25
+ - 71
26
+ - 84
27
+ - 98
28
+ - 105
29
+ 2:
30
+ - 1
31
+ - 2
32
+ - 3
33
+ - 5
34
+ - 11
35
+ - 12
36
+ - 49
37
+ - 51
38
+ - 53
39
+ - 55
40
+ - 71
41
+ - 84
42
+ - 98
43
+ - 105
44
+ 3:
45
+ - 7
46
+ - 23
47
+ 4: 3.10.13
48
+ 5: 0.16.5
49
+ 6: 4.39.3
50
+ 8:
51
+ - 1
52
+ - 2
53
+ - 5
54
+ 9:
55
+ 1: transformers_trainer
56
+ 13: linux-x86_64
57
+ m:
58
+ - 1: train/global_step
59
+ 6:
60
+ - 3
61
+ - 1: train/loss
62
+ 5: 1
63
+ 6:
64
+ - 1
65
+ - 1: train/grad_norm
66
+ 5: 1
67
+ 6:
68
+ - 1
69
+ - 1: train/learning_rate
70
+ 5: 1
71
+ 6:
72
+ - 1
73
+ - 1: train/epoch
74
+ 5: 1
75
+ 6:
76
+ - 1
77
+ vocab_size:
78
+ desc: null
79
+ value: 250880
80
+ hidden_size:
81
+ desc: null
82
+ value: 1024
83
+ n_layer:
84
+ desc: null
85
+ value: 24
86
+ n_head:
87
+ desc: null
88
+ value: 16
89
+ layer_norm_epsilon:
90
+ desc: null
91
+ value: 1.0e-05
92
+ initializer_range:
93
+ desc: null
94
+ value: 0.02
95
+ use_cache:
96
+ desc: null
97
+ value: false
98
+ pretraining_tp:
99
+ desc: null
100
+ value: 1
101
+ apply_residual_connection_post_layernorm:
102
+ desc: null
103
+ value: false
104
+ hidden_dropout:
105
+ desc: null
106
+ value: 0.0
107
+ attention_dropout:
108
+ desc: null
109
+ value: 0.0
110
+ bos_token_id:
111
+ desc: null
112
+ value: 1
113
+ eos_token_id:
114
+ desc: null
115
+ value: 2
116
+ slow_but_exact:
117
+ desc: null
118
+ value: false
119
+ return_dict:
120
+ desc: null
121
+ value: true
122
+ output_hidden_states:
123
+ desc: null
124
+ value: false
125
+ output_attentions:
126
+ desc: null
127
+ value: false
128
+ torchscript:
129
+ desc: null
130
+ value: false
131
+ torch_dtype:
132
+ desc: null
133
+ value: null
134
+ use_bfloat16:
135
+ desc: null
136
+ value: false
137
+ tf_legacy_loss:
138
+ desc: null
139
+ value: false
140
+ pruned_heads:
141
+ desc: null
142
+ value: {}
143
+ tie_word_embeddings:
144
+ desc: null
145
+ value: true
146
+ chunk_size_feed_forward:
147
+ desc: null
148
+ value: 0
149
+ is_encoder_decoder:
150
+ desc: null
151
+ value: false
152
+ is_decoder:
153
+ desc: null
154
+ value: false
155
+ cross_attention_hidden_size:
156
+ desc: null
157
+ value: null
158
+ add_cross_attention:
159
+ desc: null
160
+ value: false
161
+ tie_encoder_decoder:
162
+ desc: null
163
+ value: false
164
+ max_length:
165
+ desc: null
166
+ value: 20
167
+ min_length:
168
+ desc: null
169
+ value: 0
170
+ do_sample:
171
+ desc: null
172
+ value: false
173
+ early_stopping:
174
+ desc: null
175
+ value: false
176
+ num_beams:
177
+ desc: null
178
+ value: 1
179
+ num_beam_groups:
180
+ desc: null
181
+ value: 1
182
+ diversity_penalty:
183
+ desc: null
184
+ value: 0.0
185
+ temperature:
186
+ desc: null
187
+ value: 1.0
188
+ top_k:
189
+ desc: null
190
+ value: 50
191
+ top_p:
192
+ desc: null
193
+ value: 1.0
194
+ typical_p:
195
+ desc: null
196
+ value: 1.0
197
+ repetition_penalty:
198
+ desc: null
199
+ value: 1.0
200
+ length_penalty:
201
+ desc: null
202
+ value: 1.0
203
+ no_repeat_ngram_size:
204
+ desc: null
205
+ value: 0
206
+ encoder_no_repeat_ngram_size:
207
+ desc: null
208
+ value: 0
209
+ bad_words_ids:
210
+ desc: null
211
+ value: null
212
+ num_return_sequences:
213
+ desc: null
214
+ value: 1
215
+ output_scores:
216
+ desc: null
217
+ value: false
218
+ return_dict_in_generate:
219
+ desc: null
220
+ value: false
221
+ forced_bos_token_id:
222
+ desc: null
223
+ value: null
224
+ forced_eos_token_id:
225
+ desc: null
226
+ value: null
227
+ remove_invalid_values:
228
+ desc: null
229
+ value: false
230
+ exponential_decay_length_penalty:
231
+ desc: null
232
+ value: null
233
+ suppress_tokens:
234
+ desc: null
235
+ value: null
236
+ begin_suppress_tokens:
237
+ desc: null
238
+ value: null
239
+ architectures:
240
+ desc: null
241
+ value:
242
+ - BloomForCausalLM
243
+ finetuning_task:
244
+ desc: null
245
+ value: null
246
+ id2label:
247
+ desc: null
248
+ value:
249
+ '0': LABEL_0
250
+ '1': LABEL_1
251
+ label2id:
252
+ desc: null
253
+ value:
254
+ LABEL_0: 0
255
+ LABEL_1: 1
256
+ tokenizer_class:
257
+ desc: null
258
+ value: null
259
+ prefix:
260
+ desc: null
261
+ value: null
262
+ pad_token_id:
263
+ desc: null
264
+ value: 3
265
+ sep_token_id:
266
+ desc: null
267
+ value: null
268
+ decoder_start_token_id:
269
+ desc: null
270
+ value: null
271
+ task_specific_params:
272
+ desc: null
273
+ value: null
274
+ problem_type:
275
+ desc: null
276
+ value: null
277
+ _name_or_path:
278
+ desc: null
279
+ value: bigscience/bloomz-560m
280
+ transformers_version:
281
+ desc: null
282
+ value: 4.39.3
283
+ attention_softmax_in_fp32:
284
+ desc: null
285
+ value: true
286
+ bias_dropout_fusion:
287
+ desc: null
288
+ value: true
289
+ unk_token_id:
290
+ desc: null
291
+ value: 0
292
+ masked_softmax_fusion:
293
+ desc: null
294
+ value: true
295
+ model_type:
296
+ desc: null
297
+ value: bloom
298
+ n_inner:
299
+ desc: null
300
+ value: null
301
+ offset_alibi:
302
+ desc: null
303
+ value: 100
304
+ seq_length:
305
+ desc: null
306
+ value: 2048
307
+ skip_bias_add:
308
+ desc: null
309
+ value: true
310
+ skip_bias_add_qkv:
311
+ desc: null
312
+ value: false
313
+ quantization_config:
314
+ desc: null
315
+ value:
316
+ quant_method: QuantizationMethod.BITS_AND_BYTES
317
+ _load_in_8bit: false
318
+ _load_in_4bit: true
319
+ llm_int8_threshold: 6.0
320
+ llm_int8_skip_modules: null
321
+ llm_int8_enable_fp32_cpu_offload: false
322
+ llm_int8_has_fp16_weight: false
323
+ bnb_4bit_quant_type: nf4
324
+ bnb_4bit_use_double_quant: false
325
+ bnb_4bit_compute_dtype: float16
326
+ bnb_4bit_quant_storage: uint8
327
+ load_in_4bit: true
328
+ load_in_8bit: false
329
+ output_dir:
330
+ desc: null
331
+ value: /kaggle/working/
332
+ overwrite_output_dir:
333
+ desc: null
334
+ value: false
335
+ do_train:
336
+ desc: null
337
+ value: false
338
+ do_eval:
339
+ desc: null
340
+ value: false
341
+ do_predict:
342
+ desc: null
343
+ value: false
344
+ evaluation_strategy:
345
+ desc: null
346
+ value: 'no'
347
+ prediction_loss_only:
348
+ desc: null
349
+ value: false
350
+ per_device_train_batch_size:
351
+ desc: null
352
+ value: 8
353
+ per_device_eval_batch_size:
354
+ desc: null
355
+ value: 8
356
+ per_gpu_train_batch_size:
357
+ desc: null
358
+ value: null
359
+ per_gpu_eval_batch_size:
360
+ desc: null
361
+ value: null
362
+ gradient_accumulation_steps:
363
+ desc: null
364
+ value: 1
365
+ eval_accumulation_steps:
366
+ desc: null
367
+ value: null
368
+ eval_delay:
369
+ desc: null
370
+ value: 0
371
+ learning_rate:
372
+ desc: null
373
+ value: 3.0e-05
374
+ weight_decay:
375
+ desc: null
376
+ value: 0.001
377
+ adam_beta1:
378
+ desc: null
379
+ value: 0.9
380
+ adam_beta2:
381
+ desc: null
382
+ value: 0.999
383
+ adam_epsilon:
384
+ desc: null
385
+ value: 1.0e-08
386
+ max_grad_norm:
387
+ desc: null
388
+ value: 0.3
389
+ num_train_epochs:
390
+ desc: null
391
+ value: 5
392
+ max_steps:
393
+ desc: null
394
+ value: 18000
395
+ lr_scheduler_type:
396
+ desc: null
397
+ value: cosine
398
+ lr_scheduler_kwargs:
399
+ desc: null
400
+ value: {}
401
+ warmup_ratio:
402
+ desc: null
403
+ value: 0.03
404
+ warmup_steps:
405
+ desc: null
406
+ value: 0
407
+ log_level:
408
+ desc: null
409
+ value: passive
410
+ log_level_replica:
411
+ desc: null
412
+ value: warning
413
+ log_on_each_node:
414
+ desc: null
415
+ value: true
416
+ logging_dir:
417
+ desc: null
418
+ value: /kaggle/working/runs/Apr11_04-04-49_321ddc84c049
419
+ logging_strategy:
420
+ desc: null
421
+ value: steps
422
+ logging_first_step:
423
+ desc: null
424
+ value: false
425
+ logging_steps:
426
+ desc: null
427
+ value: 20
428
+ logging_nan_inf_filter:
429
+ desc: null
430
+ value: true
431
+ save_strategy:
432
+ desc: null
433
+ value: steps
434
+ save_steps:
435
+ desc: null
436
+ value: 20
437
+ save_total_limit:
438
+ desc: null
439
+ value: 1
440
+ save_safetensors:
441
+ desc: null
442
+ value: true
443
+ save_on_each_node:
444
+ desc: null
445
+ value: false
446
+ save_only_model:
447
+ desc: null
448
+ value: false
449
+ no_cuda:
450
+ desc: null
451
+ value: false
452
+ use_cpu:
453
+ desc: null
454
+ value: false
455
+ use_mps_device:
456
+ desc: null
457
+ value: false
458
+ seed:
459
+ desc: null
460
+ value: 42
461
+ data_seed:
462
+ desc: null
463
+ value: null
464
+ jit_mode_eval:
465
+ desc: null
466
+ value: false
467
+ use_ipex:
468
+ desc: null
469
+ value: false
470
+ bf16:
471
+ desc: null
472
+ value: false
473
+ fp16:
474
+ desc: null
475
+ value: false
476
+ fp16_opt_level:
477
+ desc: null
478
+ value: O1
479
+ half_precision_backend:
480
+ desc: null
481
+ value: auto
482
+ bf16_full_eval:
483
+ desc: null
484
+ value: false
485
+ fp16_full_eval:
486
+ desc: null
487
+ value: false
488
+ tf32:
489
+ desc: null
490
+ value: null
491
+ local_rank:
492
+ desc: null
493
+ value: 0
494
+ ddp_backend:
495
+ desc: null
496
+ value: null
497
+ tpu_num_cores:
498
+ desc: null
499
+ value: null
500
+ tpu_metrics_debug:
501
+ desc: null
502
+ value: false
503
+ debug:
504
+ desc: null
505
+ value: []
506
+ dataloader_drop_last:
507
+ desc: null
508
+ value: false
509
+ eval_steps:
510
+ desc: null
511
+ value: null
512
+ dataloader_num_workers:
513
+ desc: null
514
+ value: 8
515
+ dataloader_prefetch_factor:
516
+ desc: null
517
+ value: null
518
+ past_index:
519
+ desc: null
520
+ value: -1
521
+ run_name:
522
+ desc: null
523
+ value: /kaggle/working/
524
+ disable_tqdm:
525
+ desc: null
526
+ value: false
527
+ remove_unused_columns:
528
+ desc: null
529
+ value: true
530
+ label_names:
531
+ desc: null
532
+ value: null
533
+ load_best_model_at_end:
534
+ desc: null
535
+ value: false
536
+ metric_for_best_model:
537
+ desc: null
538
+ value: null
539
+ greater_is_better:
540
+ desc: null
541
+ value: null
542
+ ignore_data_skip:
543
+ desc: null
544
+ value: false
545
+ fsdp:
546
+ desc: null
547
+ value: []
548
+ fsdp_min_num_params:
549
+ desc: null
550
+ value: 0
551
+ fsdp_config:
552
+ desc: null
553
+ value:
554
+ min_num_params: 0
555
+ xla: false
556
+ xla_fsdp_v2: false
557
+ xla_fsdp_grad_ckpt: false
558
+ fsdp_transformer_layer_cls_to_wrap:
559
+ desc: null
560
+ value: null
561
+ accelerator_config:
562
+ desc: null
563
+ value:
564
+ split_batches: false
565
+ dispatch_batches: null
566
+ even_batches: true
567
+ use_seedable_sampler: true
568
+ deepspeed:
569
+ desc: null
570
+ value: null
571
+ label_smoothing_factor:
572
+ desc: null
573
+ value: 0.0
574
+ optim:
575
+ desc: null
576
+ value: paged_adamw_32bit
577
+ optim_args:
578
+ desc: null
579
+ value: null
580
+ adafactor:
581
+ desc: null
582
+ value: false
583
+ group_by_length:
584
+ desc: null
585
+ value: false
586
+ length_column_name:
587
+ desc: null
588
+ value: length
589
+ report_to:
590
+ desc: null
591
+ value:
592
+ - tensorboard
593
+ - wandb
594
+ ddp_find_unused_parameters:
595
+ desc: null
596
+ value: null
597
+ ddp_bucket_cap_mb:
598
+ desc: null
599
+ value: null
600
+ ddp_broadcast_buffers:
601
+ desc: null
602
+ value: null
603
+ dataloader_pin_memory:
604
+ desc: null
605
+ value: true
606
+ dataloader_persistent_workers:
607
+ desc: null
608
+ value: false
609
+ skip_memory_metrics:
610
+ desc: null
611
+ value: true
612
+ use_legacy_prediction_loop:
613
+ desc: null
614
+ value: false
615
+ push_to_hub:
616
+ desc: null
617
+ value: false
618
+ resume_from_checkpoint:
619
+ desc: null
620
+ value: null
621
+ hub_model_id:
622
+ desc: null
623
+ value: null
624
+ hub_strategy:
625
+ desc: null
626
+ value: every_save
627
+ hub_token:
628
+ desc: null
629
+ value: <HUB_TOKEN>
630
+ hub_private_repo:
631
+ desc: null
632
+ value: false
633
+ hub_always_push:
634
+ desc: null
635
+ value: false
636
+ gradient_checkpointing:
637
+ desc: null
638
+ value: true
639
+ gradient_checkpointing_kwargs:
640
+ desc: null
641
+ value: null
642
+ include_inputs_for_metrics:
643
+ desc: null
644
+ value: false
645
+ fp16_backend:
646
+ desc: null
647
+ value: auto
648
+ push_to_hub_model_id:
649
+ desc: null
650
+ value: null
651
+ push_to_hub_organization:
652
+ desc: null
653
+ value: null
654
+ push_to_hub_token:
655
+ desc: null
656
+ value: <PUSH_TO_HUB_TOKEN>
657
+ mp_parameters:
658
+ desc: null
659
+ value: ''
660
+ auto_find_batch_size:
661
+ desc: null
662
+ value: true
663
+ full_determinism:
664
+ desc: null
665
+ value: false
666
+ torchdynamo:
667
+ desc: null
668
+ value: null
669
+ ray_scope:
670
+ desc: null
671
+ value: last
672
+ ddp_timeout:
673
+ desc: null
674
+ value: 1800
675
+ torch_compile:
676
+ desc: null
677
+ value: false
678
+ torch_compile_backend:
679
+ desc: null
680
+ value: null
681
+ torch_compile_mode:
682
+ desc: null
683
+ value: null
684
+ dispatch_batches:
685
+ desc: null
686
+ value: null
687
+ split_batches:
688
+ desc: null
689
+ value: null
690
+ include_tokens_per_second:
691
+ desc: null
692
+ value: false
693
+ include_num_input_tokens_seen:
694
+ desc: null
695
+ value: false
696
+ neftune_noise_alpha:
697
+ desc: null
698
+ value: null
699
+ optim_target_modules:
700
+ desc: null
701
+ value: null
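One small piece of arithmetic worth spelling out for this second run's config: with lr_scheduler_type cosine, warmup_ratio 0.03 and max_steps 18000, Trainer derives the warmup length from the ratio. The snippet below only shows that calculation for convenience; it is not anything logged by wandb.

import math

max_steps = 18000      # from max_steps above (this run raises the step budget from 7000 to 18000)
warmup_ratio = 0.03    # from warmup_ratio above
warmup_steps = math.ceil(max_steps * warmup_ratio)  # linear warmup, then cosine decay to step 18000
print(warmup_steps)    # 540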
wandb/run-20240411_040455-4dprer7c/files/output.log ADDED
@@ -0,0 +1,12 @@
1
+ /opt/conda/lib/python3.10/site-packages/torch/utils/data/dataloader.py:557: UserWarning: This DataLoader will create 8 worker processes in total. Our suggested max number of worker in current system is 4, which is smaller than what this DataLoader is going to create. Please be aware that excessive worker creation might get DataLoader running slow or even freeze, lower the worker number to avoid potential slowness/freeze if necessary.
2
+ warnings.warn(_create_warning_msg(
3
+ /opt/conda/lib/python3.10/site-packages/torch/utils/checkpoint.py:429: UserWarning: torch.utils.checkpoint: please pass in use_reentrant=True or use_reentrant=False explicitly. The default value of use_reentrant will be updated to be False in the future. To maintain current behavior, pass use_reentrant=True. It is recommended that you use use_reentrant=False. Refer to docs for more details on the differences between the two variants.
4
+ warnings.warn(
5
+ /opt/conda/lib/python3.10/site-packages/torch/nn/parallel/_functions.py:68: UserWarning: Was asked to gather along dimension 0, but all input tensors were scalars; will instead unsqueeze and return a vector.
6
+ warnings.warn('Was asked to gather along dimension 0, but all '
7
+ /opt/conda/lib/python3.10/site-packages/peft/utils/save_and_load.py:139: UserWarning: Setting `save_embedding_layers` to `True` as embedding layers found in `target_modules`.
8
+ warnings.warn("Setting `save_embedding_layers` to `True` as embedding layers found in `target_modules`.")
9
+ /opt/conda/lib/python3.10/site-packages/torch/utils/checkpoint.py:429: UserWarning: torch.utils.checkpoint: please pass in use_reentrant=True or use_reentrant=False explicitly. The default value of use_reentrant will be updated to be False in the future. To maintain current behavior, pass use_reentrant=True. It is recommended that you use use_reentrant=False. Refer to docs for more details on the differences between the two variants.
10
+ warnings.warn(
11
+ /opt/conda/lib/python3.10/site-packages/torch/nn/parallel/_functions.py:68: UserWarning: Was asked to gather along dimension 0, but all input tensors were scalars; will instead unsqueeze and return a vector.
12
+ warnings.warn('Was asked to gather along dimension 0, but all '
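The UserWarnings captured in this output.log (over-subscribed DataLoader workers on a 4-vCPU Kaggle VM, the use_reentrant deprecation from torch.utils.checkpoint, and PEFT forcing save_embedding_layers) are benign for this run. For reference only, a hedged sketch of how the first two are commonly quieted when rebuilding the TrainingArguments; this is not something the logged run did.

from transformers import TrainingArguments

# Hypothetical adjustment (not applied in this run): match the worker count to the
# 4 logical CPUs reported in wandb-metadata.json, and pass use_reentrant explicitly
# so torch.utils.checkpoint stops warning about its future default.
args = TrainingArguments(
    output_dir="/kaggle/working/",
    dataloader_num_workers=4,
    gradient_checkpointing=True,
    gradient_checkpointing_kwargs={"use_reentrant": False},
)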
wandb/run-20240411_040455-4dprer7c/files/requirements.txt ADDED
@@ -0,0 +1,864 @@
1
+ Babel==2.14.0
2
+ Boruta==0.3
3
+ Brotli==1.0.9
4
+ CVXcanon==0.1.2
5
+ Cartopy==0.22.0
6
+ Cython==3.0.8
7
+ Deprecated==1.2.14
8
+ Farama-Notifications==0.0.4
9
+ Flask==3.0.2
10
+ Geohash==1.0
11
+ GitPython==3.1.41
12
+ ImageHash==4.3.1
13
+ Janome==0.5.0
14
+ Jinja2==3.1.2
15
+ LunarCalendar==0.0.9
16
+ Mako==1.3.2
17
+ Markdown==3.5.2
18
+ MarkupSafe==2.1.3
19
+ MarkupSafe==2.1.5
20
+ Pillow==9.5.0
21
+ PuLP==2.8.0
22
+ PyArabic==0.6.15
23
+ PyJWT==2.8.0
24
+ PyMeeus==0.5.12
25
+ PySocks==1.7.1
26
+ PyUpSet==0.1.1.post7
27
+ PyWavelets==1.5.0
28
+ PyYAML==6.0.1
29
+ Pygments==2.17.2
30
+ Pympler==1.0.1
31
+ QtPy==2.4.1
32
+ Rtree==1.2.0
33
+ SQLAlchemy==2.0.25
34
+ SecretStorage==3.3.3
35
+ Send2Trash==1.8.2
36
+ Shapely==1.8.5.post1
37
+ Shimmy==1.3.0
38
+ SimpleITK==2.3.1
39
+ TPOT==0.12.1
40
+ Theano-PyMC==1.1.2
41
+ Theano==1.0.5
42
+ Wand==0.6.13
43
+ Werkzeug==3.0.2
44
+ absl-py==1.4.0
45
+ accelerate==0.28.0
46
+ access==1.1.9
47
+ affine==2.4.0
48
+ aiobotocore==2.12.2
49
+ aiofiles==22.1.0
50
+ aiohttp-cors==0.7.0
51
+ aiohttp==3.9.1
52
+ aioitertools==0.11.0
53
+ aiorwlock==1.3.0
54
+ aiosignal==1.3.1
55
+ aiosqlite==0.19.0
56
+ albumentations==1.4.0
57
+ alembic==1.13.1
58
+ altair==5.3.0
59
+ annotated-types==0.6.0
60
+ annoy==1.17.3
61
+ anyio==4.2.0
62
+ apache-beam==2.46.0
63
+ aplus==0.11.0
64
+ appdirs==1.4.4
65
+ archspec==0.2.3
66
+ argon2-cffi-bindings==21.2.0
67
+ argon2-cffi==23.1.0
68
+ array-record==0.5.0
69
+ arrow==1.3.0
70
+ arviz==0.17.1
71
+ astroid==3.1.0
72
+ astropy-iers-data==0.2024.4.1.0.33.14
73
+ astropy==6.0.1
74
+ asttokens==2.4.1
75
+ astunparse==1.6.3
76
+ async-lru==2.0.4
77
+ async-timeout==4.0.3
78
+ attrs==23.2.0
79
+ audioread==3.0.1
80
+ autopep8==2.0.4
81
+ backoff==2.2.1
82
+ bayesian-optimization==1.4.3
83
+ beatrix_jupyterlab==2023.128.151533
84
+ beautifulsoup4==4.12.2
85
+ bitsandbytes==0.43.0
86
+ blake3==0.2.1
87
+ bleach==6.1.0
88
+ blessed==1.20.0
89
+ blinker==1.7.0
90
+ blis==0.7.10
91
+ blosc2==2.6.0
92
+ bokeh==3.3.4
93
+ boltons==23.1.1
94
+ boto3==1.26.100
95
+ botocore==1.34.51
96
+ bq_helper==0.4.1
97
+ bqplot==0.12.43
98
+ branca==0.7.1
99
+ brewer2mpl==1.4.1
100
+ brotlipy==0.7.0
101
+ cached-property==1.5.2
102
+ cachetools==4.2.4
103
+ cachetools==5.3.2
104
+ catalogue==2.0.10
105
+ catalyst==22.4
106
+ catboost==1.2.3
107
+ category-encoders==2.6.3
108
+ certifi==2024.2.2
109
+ cesium==0.12.1
110
+ cffi==1.16.0
111
+ charset-normalizer==3.3.2
112
+ chex==0.1.86
113
+ cleverhans==4.0.0
114
+ click-plugins==1.1.1
115
+ click==8.1.7
116
+ cligj==0.7.2
117
+ cloud-tpu-client==0.10
118
+ cloud-tpu-profiler==2.4.0
119
+ cloudpathlib==0.16.0
120
+ cloudpickle==2.2.1
121
+ cloudpickle==3.0.0
122
+ cmdstanpy==1.2.2
123
+ colorama==0.4.6
124
+ colorcet==3.1.0
125
+ colorful==0.5.6
126
+ colorlog==6.8.2
127
+ colorlover==0.3.0
128
+ comm==0.2.1
129
+ conda-libmamba-solver==23.7.0
130
+ conda-package-handling==2.2.0
131
+ conda==23.7.4
132
+ conda_package_streaming==0.9.0
133
+ confection==0.1.4
134
+ contextily==1.6.0
135
+ contourpy==1.2.0
136
+ convertdate==2.4.0
137
+ crcmod==1.7
138
+ cryptography==41.0.7
139
+ cuda-python==12.4.0
140
+ cudf==23.8.0
141
+ cufflinks==0.17.3
142
+ cuml==23.8.0
143
+ cupy==13.0.0
144
+ cycler==0.12.1
145
+ cymem==2.0.8
146
+ cytoolz==0.12.3
147
+ daal4py==2024.2.0
148
+ daal==2024.2.0
149
+ dacite==1.8.1
150
+ dask-cuda==23.8.0
151
+ dask-cudf==23.8.0
152
+ dask-expr==1.0.9
153
+ dask==2024.4.0
154
+ dataclasses-json==0.6.4
155
+ dataproc_jupyter_plugin==0.1.66
156
+ datasets==2.16.0
157
+ datashader==0.16.0
158
+ datatile==1.0.3
159
+ db-dtypes==1.2.0
160
+ deap==1.4.1
161
+ debugpy==1.8.0
162
+ decorator==5.1.1
163
+ deepdiff==6.7.1
164
+ defusedxml==0.7.1
165
+ deprecation==2.1.0
166
+ descartes==1.1.0
167
+ dill==0.3.7
168
+ dipy==1.9.0
169
+ distlib==0.3.8
170
+ distributed==2023.7.1
171
+ distro==1.9.0
172
+ dm-tree==0.1.8
173
+ docker-pycreds==0.4.0
174
+ docker==7.0.0
175
+ docopt==0.6.2
176
+ docstring-parser==0.15
177
+ docstring-to-markdown==0.15
178
+ docutils==0.20.1
179
+ earthengine-api==0.1.395
180
+ easydict==1.13
181
+ easyocr==1.7.1
182
+ ecos==2.0.13
183
+ eli5==0.13.0
184
+ emoji==2.11.0
185
+ en-core-web-lg==3.7.1
186
+ en-core-web-sm==3.7.1
187
+ entrypoints==0.4
188
+ ephem==4.1.5
189
+ esda==2.5.1
190
+ essentia==2.1b6.dev1110
191
+ et-xmlfile==1.1.0
192
+ etils==1.6.0
193
+ exceptiongroup==1.2.0
194
+ executing==2.0.1
195
+ explainable-ai-sdk==1.3.3
196
+ fastai==2.7.14
197
+ fastapi==0.108.0
198
+ fastavro==1.9.3
199
+ fastcore==1.5.29
200
+ fastdownload==0.0.7
201
+ fasteners==0.19
202
+ fastjsonschema==2.19.1
203
+ fastprogress==1.0.3
204
+ fastrlock==0.8.2
205
+ fasttext==0.9.2
206
+ feather-format==0.4.1
207
+ featuretools==1.30.0
208
+ filelock==3.13.1
209
+ fiona==1.9.6
210
+ fitter==1.7.0
211
+ flake8==7.0.0
212
+ flashtext==2.7
213
+ flatbuffers==23.5.26
214
+ flax==0.8.2
215
+ folium==0.16.0
216
+ fonttools==4.47.0
217
+ fonttools==4.50.0
218
+ fqdn==1.5.1
219
+ frozendict==2.4.1
220
+ frozenlist==1.4.1
221
+ fsspec==2023.10.0
222
+ fsspec==2024.3.1
223
+ funcy==2.0
224
+ fury==0.10.0
225
+ future==1.0.0
226
+ fuzzywuzzy==0.18.0
227
+ gast==0.5.4
228
+ gatspy==0.3
229
+ gcsfs==2024.2.0
230
+ gensim==4.3.2
231
+ geographiclib==2.0
232
+ geojson==3.1.0
233
+ geopandas==0.14.3
234
+ geoplot==0.5.1
235
+ geopy==2.4.1
236
+ geoviews==1.11.1
237
+ ggplot==0.11.5
238
+ giddy==2.3.5
239
+ gitdb==4.0.11
240
+ google-ai-generativelanguage==0.4.0
241
+ google-api-core==2.11.1
242
+ google-api-core==2.18.0
243
+ google-api-python-client==2.125.0
244
+ google-apitools==0.5.31
245
+ google-auth-httplib2==0.2.0
246
+ google-auth-oauthlib==1.2.0
247
+ google-auth==2.26.1
248
+ google-cloud-aiplatform==0.6.0a1
249
+ google-cloud-artifact-registry==1.10.0
250
+ google-cloud-automl==1.0.1
251
+ google-cloud-bigquery==2.34.4
252
+ google-cloud-bigtable==1.7.3
253
+ google-cloud-core==2.4.1
254
+ google-cloud-datastore==2.19.0
255
+ google-cloud-dlp==3.14.0
256
+ google-cloud-jupyter-config==0.0.5
257
+ google-cloud-language==2.13.3
258
+ google-cloud-monitoring==2.18.0
259
+ google-cloud-pubsub==2.19.0
260
+ google-cloud-pubsublite==1.9.0
261
+ google-cloud-recommendations-ai==0.7.1
262
+ google-cloud-resource-manager==1.11.0
263
+ google-cloud-spanner==3.40.1
264
+ google-cloud-storage==1.44.0
265
+ google-cloud-translate==3.12.1
266
+ google-cloud-videointelligence==2.13.3
267
+ google-cloud-vision==2.8.0
268
+ google-crc32c==1.5.0
269
+ google-generativeai==0.4.1
270
+ google-pasta==0.2.0
271
+ google-resumable-media==2.7.0
272
+ googleapis-common-protos==1.62.0
273
+ gplearn==0.4.2
274
+ gpustat==1.0.0
275
+ gpxpy==1.6.2
276
+ graphviz==0.20.3
277
+ greenlet==3.0.3
278
+ grpc-google-iam-v1==0.12.7
279
+ grpcio-status==1.48.1
280
+ grpcio-status==1.48.2
281
+ grpcio==1.51.1
282
+ grpcio==1.60.0
283
+ gviz-api==1.10.0
284
+ gym-notices==0.0.8
285
+ gym==0.26.2
286
+ gymnasium==0.29.0
287
+ h11==0.14.0
288
+ h2o==3.46.0.1
289
+ h5netcdf==1.3.0
290
+ h5py==3.10.0
291
+ haversine==2.8.1
292
+ hdfs==2.7.3
293
+ hep-ml==0.7.2
294
+ hijri-converter==2.3.1
295
+ hmmlearn==0.3.2
296
+ holidays==0.24
297
+ holoviews==1.18.3
298
+ hpsklearn==0.1.0
299
+ html5lib==1.1
300
+ htmlmin==0.1.12
301
+ httpcore==1.0.5
302
+ httplib2==0.21.0
303
+ httptools==0.6.1
304
+ httpx==0.27.0
305
+ huggingface-hub==0.22.2
306
+ hunspell==0.5.5
307
+ hydra-slayer==0.5.0
308
+ hyperopt==0.2.7
309
+ hypertools==0.8.0
310
+ idna==3.6
311
+ igraph==0.11.4
312
+ imagecodecs==2024.1.1
313
+ imageio==2.33.1
314
+ imbalanced-learn==0.12.2
315
+ imgaug==0.4.0
316
+ importlib-metadata==6.11.0
317
+ importlib-metadata==7.0.1
318
+ importlib-resources==6.1.1
319
+ inequality==1.0.1
320
+ iniconfig==2.0.0
321
+ ipydatawidgets==4.3.5
322
+ ipykernel==6.28.0
323
+ ipyleaflet==0.18.2
324
+ ipympl==0.7.0
325
+ ipython-genutils==0.2.0
326
+ ipython-genutils==0.2.0
327
+ ipython-sql==0.5.0
328
+ ipython==8.20.0
329
+ ipyvolume==0.6.3
330
+ ipyvue==1.10.2
331
+ ipyvuetify==1.9.3
332
+ ipywebrtc==0.6.0
333
+ ipywidgets==7.7.1
334
+ isoduration==20.11.0
335
+ isort==5.13.2
336
+ isoweek==1.3.3
337
+ itsdangerous==2.1.2
338
+ jaraco.classes==3.3.0
339
+ jax-jumpy==1.0.0
340
+ jax==0.4.23
341
+ jaxlib==0.4.23.dev20240116
342
+ jedi==0.19.1
343
+ jeepney==0.8.0
344
+ jieba==0.42.1
345
+ jmespath==1.0.1
346
+ joblib==1.3.2
347
+ json5==0.9.14
348
+ jsonpatch==1.33
349
+ jsonpointer==2.4
350
+ jsonschema-specifications==2023.12.1
351
+ jsonschema==4.20.0
352
+ jupyter-console==6.6.3
353
+ jupyter-events==0.9.0
354
+ jupyter-http-over-ws==0.0.8
355
+ jupyter-lsp==1.5.1
356
+ jupyter-server-mathjax==0.2.6
357
+ jupyter-ydoc==0.2.5
358
+ jupyter_client==7.4.9
359
+ jupyter_client==8.6.0
360
+ jupyter_core==5.7.1
361
+ jupyter_server==2.13.0
362
+ jupyter_server_fileid==0.9.1
363
+ jupyter_server_proxy==4.1.0
364
+ jupyter_server_terminals==0.5.1
365
+ jupyter_server_ydoc==0.8.0
366
+ jupyterlab-lsp==5.1.0
367
+ jupyterlab-widgets==3.0.9
368
+ jupyterlab==4.1.5
369
+ jupyterlab_git==0.44.0
370
+ jupyterlab_pygments==0.3.0
371
+ jupyterlab_server==2.25.2
372
+ jupytext==1.16.0
373
+ kaggle-environments==1.14.3
374
+ kaggle==1.6.8
375
+ kagglehub==0.2.2
376
+ keras-cv==0.8.2
377
+ keras-nlp==0.8.2
378
+ keras-tuner==1.4.6
379
+ keras==3.1.1
380
+ kernels-mixer==0.0.7
381
+ keyring==24.3.0
382
+ keyrings.google-artifactregistry-auth==1.1.2
383
+ kfp-pipeline-spec==0.2.2
384
+ kfp-server-api==2.0.5
385
+ kfp==2.5.0
386
+ kiwisolver==1.4.5
387
+ kmapper==2.0.1
388
+ kmodes==0.12.2
389
+ korean-lunar-calendar==0.3.1
390
+ kornia==0.7.2
391
+ kornia_rs==0.1.3
392
+ kt-legacy==1.0.5
393
+ kubernetes==26.1.0
394
+ langcodes==3.3.0
395
+ langid==1.1.6
396
+ lazy_loader==0.3
397
+ learntools==0.3.4
398
+ leven==1.0.4
399
+ libclang==16.0.6
400
+ libmambapy==1.5.0
401
+ libpysal==4.9.2
402
+ librosa==0.10.1
403
+ lightgbm==4.2.0
404
+ lightning-utilities==0.11.2
405
+ lime==0.2.0.1
406
+ line-profiler==4.1.2
407
+ linkify-it-py==2.0.3
408
+ llvmlite==0.41.1
409
+ llvmlite==0.42.0
410
+ lml==0.1.0
411
+ locket==1.0.0
412
+ loguru==0.7.2
413
+ lxml==5.2.1
414
+ lz4==4.3.3
415
+ mamba==1.5.0
416
+ mapclassify==2.6.1
417
+ markdown-it-py==3.0.0
418
+ marshmallow==3.21.1
419
+ matplotlib-inline==0.1.6
420
+ matplotlib-venn==0.11.10
421
+ matplotlib==3.7.5
422
+ matplotlib==3.8.3
423
+ mccabe==0.7.0
424
+ mdit-py-plugins==0.4.0
425
+ mdurl==0.1.2
426
+ memory-profiler==0.61.0
427
+ menuinst==2.0.1
428
+ mercantile==1.2.1
429
+ mgwr==2.2.1
430
+ missingno==0.5.2
431
+ mistune==0.8.4
432
+ mizani==0.11.1
433
+ ml-dtypes==0.2.0
434
+ mlcrate==0.2.0
435
+ mlens==0.2.3
436
+ mlxtend==0.23.1
437
+ mne==1.6.1
438
+ mnist==0.2.2
439
+ momepy==0.7.0
440
+ more-itertools==10.2.0
441
+ mpld3==0.5.10
442
+ mpmath==1.3.0
443
+ msgpack==1.0.7
444
+ multidict==6.0.4
445
+ multimethod==1.10
446
+ multipledispatch==1.0.0
447
+ multiprocess==0.70.15
448
+ munkres==1.1.4
449
+ murmurhash==1.0.10
450
+ mypy-extensions==1.0.0
451
+ namex==0.0.7
452
+ nb-conda-kernels==2.3.1
453
+ nb_conda==2.2.1
454
+ nbclassic==1.0.0
455
+ nbclient==0.5.13
456
+ nbconvert==6.4.5
457
+ nbdime==3.2.0
458
+ nbformat==5.9.2
459
+ ndindex==1.8
460
+ nest-asyncio==1.5.8
461
+ networkx==3.2.1
462
+ nibabel==5.2.1
463
+ nilearn==0.10.3
464
+ ninja==1.11.1.1
465
+ nltk==3.2.4
466
+ nose==1.3.7
467
+ notebook==6.5.4
468
+ notebook==6.5.6
469
+ notebook_executor==0.2
470
+ notebook_shim==0.2.3
471
+ numba==0.58.1
472
+ numba==0.59.1
473
+ numexpr==2.10.0
474
+ numpy==1.26.4
475
+ nvidia-ml-py==11.495.46
476
+ nvtx==0.2.10
477
+ oauth2client==4.1.3
478
+ oauthlib==3.2.2
479
+ objsize==0.6.1
480
+ odfpy==1.4.1
481
+ olefile==0.47
482
+ onnx==1.16.0
483
+ opencensus-context==0.1.3
484
+ opencensus==0.11.4
485
+ opencv-contrib-python==4.9.0.80
486
+ opencv-python-headless==4.9.0.80
487
+ opencv-python==4.9.0.80
488
+ openpyxl==3.1.2
489
+ openslide-python==1.3.1
490
+ opentelemetry-api==1.22.0
491
+ opentelemetry-exporter-otlp-proto-common==1.22.0
492
+ opentelemetry-exporter-otlp-proto-grpc==1.22.0
493
+ opentelemetry-exporter-otlp-proto-http==1.22.0
494
+ opentelemetry-exporter-otlp==1.22.0
495
+ opentelemetry-proto==1.22.0
496
+ opentelemetry-sdk==1.22.0
497
+ opentelemetry-semantic-conventions==0.43b0
498
+ opt-einsum==3.3.0
499
+ optax==0.2.2
500
+ optree==0.11.0
501
+ optuna==3.6.1
502
+ orbax-checkpoint==0.5.7
503
+ ordered-set==4.1.0
504
+ orjson==3.9.10
505
+ ortools==9.4.1874
506
+ osmnx==1.9.2
507
+ overrides==7.4.0
508
+ packaging==21.3
509
+ pandas-datareader==0.10.0
510
+ pandas-profiling==3.6.6
511
+ pandas-summary==0.2.0
512
+ pandas==2.1.4
513
+ pandas==2.2.1
514
+ pandasql==0.7.3
515
+ pandocfilters==1.5.0
516
+ panel==1.3.8
517
+ papermill==2.5.0
518
+ param==2.1.0
519
+ parso==0.8.3
520
+ partd==1.4.1
521
+ path.py==12.5.0
522
+ path==16.10.0
523
+ pathos==0.3.2
524
+ pathy==0.10.3
525
+ patsy==0.5.6
526
+ pdf2image==1.17.0
527
+ peft==0.10.0
528
+ pettingzoo==1.24.0
529
+ pexpect==4.8.0
530
+ pexpect==4.9.0
531
+ phik==0.12.4
532
+ pickleshare==0.7.5
533
+ pillow==10.3.0
534
+ pip==23.3.2
535
+ pkgutil_resolve_name==1.3.10
536
+ platformdirs==4.2.0
537
+ plotly-express==0.4.1
538
+ plotly==5.18.0
539
+ plotnine==0.13.4
540
+ pluggy==1.4.0
541
+ pointpats==2.4.0
542
+ polars==0.20.18
543
+ polyglot==16.7.4
544
+ pooch==1.8.1
545
+ pox==0.3.4
546
+ ppca==0.0.4
547
+ ppft==1.7.6.8
548
+ preprocessing==0.1.13
549
+ preshed==3.0.9
550
+ prettytable==3.9.0
551
+ progressbar2==4.4.2
552
+ prometheus-client==0.19.0
553
+ promise==2.3
554
+ prompt-toolkit==3.0.42
555
+ prompt-toolkit==3.0.43
556
+ prophet==1.1.1
557
+ proto-plus==1.23.0
558
+ protobuf==3.20.3
559
+ protobuf==4.21.12
560
+ psutil==5.9.3
561
+ psutil==5.9.7
562
+ ptyprocess==0.7.0
563
+ pudb==2024.1
564
+ pure-eval==0.2.2
565
+ py-cpuinfo==9.0.0
566
+ py-spy==0.3.14
567
+ py4j==0.10.9.7
568
+ pyLDAvis==3.4.1
569
+ pyOpenSSL==23.3.0
570
+ pyaml==23.12.0
571
+ pyarrow-hotfix==0.6
572
+ pyarrow==15.0.2
573
+ pyasn1-modules==0.3.0
574
+ pyasn1==0.5.1
575
+ pybind11==2.12.0
576
+ pyclipper==1.3.0.post5
577
+ pycodestyle==2.11.1
578
+ pycosat==0.6.6
579
+ pycparser==2.21
580
+ pycryptodome==3.20.0
581
+ pyct==0.5.0
582
+ pycuda==2024.1
583
+ pydantic==2.5.3
584
+ pydantic==2.6.4
585
+ pydantic_core==2.14.6
586
+ pydantic_core==2.16.3
587
+ pydegensac==0.1.2
588
+ pydicom==2.4.4
589
+ pydocstyle==6.3.0
590
+ pydot==1.4.2
591
+ pydub==0.25.1
592
+ pyemd==1.0.0
593
+ pyerfa==2.0.1.1
594
+ pyexcel-io==0.6.6
595
+ pyexcel-ods==0.6.0
596
+ pyflakes==3.2.0
597
+ pygltflib==1.16.2
598
+ pykalman==0.9.7
599
+ pylibraft==23.8.0
600
+ pylint==3.1.0
601
+ pymc3==3.11.4
602
+ pymongo==3.13.0
603
+ pynndescent==0.5.12
604
+ pynvml==11.4.1
605
+ pynvrtc==9.2
606
+ pyparsing==3.1.1
607
+ pyparsing==3.1.2
608
+ pypdf==4.1.0
609
+ pyproj==3.6.1
610
+ pysal==24.1
611
+ pyshp==2.3.1
612
+ pytesseract==0.3.10
613
+ pytest==8.1.1
614
+ python-bidi==0.4.2
615
+ python-dateutil==2.9.0.post0
616
+ python-dotenv==1.0.0
617
+ python-json-logger==2.0.7
618
+ python-louvain==0.16
619
+ python-lsp-jsonrpc==1.1.2
620
+ python-lsp-server==1.11.0
621
+ python-slugify==8.0.4
622
+ python-utils==3.8.2
623
+ pythreejs==2.4.2
624
+ pytoolconfig==1.3.1
625
+ pytools==2024.1.1
626
+ pytorch-ignite==0.5.0.post2
627
+ pytorch-lightning==2.2.1
628
+ pytz==2023.3.post1
629
+ pytz==2024.1
630
+ pyu2f==0.1.5
631
+ pyviz_comms==3.0.2
632
+ pyzmq==24.0.1
633
+ pyzmq==25.1.2
634
+ qgrid==1.3.1
635
+ qtconsole==5.5.1
636
+ quantecon==0.7.2
637
+ qudida==0.0.4
638
+ raft-dask==23.8.0
639
+ rasterio==1.3.9
640
+ rasterstats==0.19.0
641
+ ray-cpp==2.9.0
642
+ ray==2.9.0
643
+ referencing==0.32.1
644
+ regex==2023.12.25
645
+ requests-oauthlib==1.3.1
646
+ requests-toolbelt==0.10.1
647
+ requests==2.31.0
648
+ retrying==1.3.3
649
+ retrying==1.3.4
650
+ rfc3339-validator==0.1.4
651
+ rfc3986-validator==0.1.1
652
+ rgf-python==3.12.0
653
+ rich-click==1.7.4
654
+ rich==13.7.0
655
+ rich==13.7.1
656
+ rmm==23.8.0
657
+ rope==1.13.0
658
+ rpds-py==0.16.2
659
+ rsa==4.9
660
+ ruamel-yaml-conda==0.15.100
661
+ ruamel.yaml.clib==0.2.7
662
+ ruamel.yaml==0.17.40
663
+ s2sphere==0.2.5
664
+ s3fs==2024.2.0
665
+ s3transfer==0.6.2
666
+ safetensors==0.4.2
667
+ scattertext==0.1.19
668
+ scikit-image==0.22.0
669
+ scikit-learn-intelex==2024.2.0
670
+ scikit-learn==1.2.2
671
+ scikit-multilearn==0.2.0
672
+ scikit-optimize==0.10.1
673
+ scikit-plot==0.3.7
674
+ scikit-surprise==1.1.3
675
+ scipy==1.11.4
676
+ scipy==1.12.0
677
+ seaborn==0.12.2
678
+ segment_anything==1.0
679
+ segregation==2.5
680
+ semver==3.0.2
681
+ sentencepiece==0.2.0
682
+ sentry-sdk==1.44.1
683
+ setproctitle==1.3.3
684
+ setuptools-git==1.2
685
+ setuptools-scm==8.0.4
686
+ setuptools==69.0.3
687
+ shap==0.44.1
688
+ shapely==2.0.3
689
+ shellingham==1.5.4
690
+ shtab==1.7.1
691
+ simpervisor==1.0.0
692
+ simplejson==3.19.2
693
+ six==1.16.0
694
+ sklearn-pandas==2.2.0
695
+ slicer==0.0.7
696
+ smart-open==6.4.0
697
+ smmap==5.0.1
698
+ sniffio==1.3.0
699
+ snowballstemmer==2.2.0
700
+ snuggs==1.4.7
701
+ sortedcontainers==2.4.0
702
+ soundfile==0.12.1
703
+ soupsieve==2.5
704
+ soxr==0.3.7
705
+ spacy-legacy==3.0.12
706
+ spacy-loggers==1.0.5
707
+ spacy==3.7.2
708
+ spaghetti==1.7.5.post1
709
+ spectral==0.23.1
710
+ spglm==1.1.0
711
+ sphinx-rtd-theme==0.2.4
712
+ spint==1.0.7
713
+ splot==1.1.5.post1
714
+ spopt==0.6.0
715
+ spreg==1.4.2
716
+ spvcm==0.3.0
717
+ sqlparse==0.4.4
718
+ squarify==0.4.3
719
+ srsly==2.4.8
720
+ stable-baselines3==2.1.0
721
+ stack-data==0.6.2
722
+ stack-data==0.6.3
723
+ stanio==0.5.0
724
+ starlette==0.32.0.post1
725
+ statsmodels==0.14.1
726
+ stemming==1.0.1
727
+ stop-words==2018.7.23
728
+ stopit==1.1.2
729
+ stumpy==1.12.0
730
+ sympy==1.12
731
+ tables==3.9.2
732
+ tabulate==0.9.0
733
+ tangled-up-in-unicode==0.2.0
734
+ tbb==2021.12.0
735
+ tblib==3.0.0
736
+ tenacity==8.2.3
737
+ tensorboard-data-server==0.7.2
738
+ tensorboard-plugin-profile==2.15.0
739
+ tensorboard==2.15.1
740
+ tensorboardX==2.6.2.2
741
+ tensorflow-cloud==0.1.16
742
+ tensorflow-datasets==4.9.4
743
+ tensorflow-decision-forests==1.8.1
744
+ tensorflow-estimator==2.15.0
745
+ tensorflow-hub==0.16.1
746
+ tensorflow-io-gcs-filesystem==0.35.0
747
+ tensorflow-io==0.35.0
748
+ tensorflow-metadata==0.14.0
749
+ tensorflow-probability==0.23.0
750
+ tensorflow-serving-api==2.14.1
751
+ tensorflow-text==2.15.0
752
+ tensorflow-transform==0.14.0
753
+ tensorflow==2.15.0
754
+ tensorstore==0.1.56
755
+ termcolor==2.4.0
756
+ terminado==0.18.0
757
+ testpath==0.6.0
758
+ text-unidecode==1.3
759
+ textblob==0.18.0.post0
760
+ texttable==1.7.0
761
+ tf_keras==2.15.1
762
+ tfp-nightly==0.24.0.dev0
763
+ thinc==8.2.2
764
+ threadpoolctl==3.2.0
765
+ tifffile==2023.12.9
766
+ timm==0.9.16
767
+ tinycss2==1.2.1
768
+ tobler==0.11.2
769
+ tokenizers==0.15.2
770
+ toml==0.10.2
771
+ tomli==2.0.1
772
+ tomlkit==0.12.4
773
+ toolz==0.12.1
774
+ torch==2.1.2
775
+ torchaudio==2.1.2
776
+ torchdata==0.7.1
777
+ torchinfo==1.8.0
778
+ torchmetrics==1.3.2
779
+ torchtext==0.16.2
780
+ torchvision==0.16.2
781
+ tornado==6.3.3
782
+ tqdm==4.66.1
783
+ traceml==1.0.8
784
+ traitlets==5.9.0
785
+ traittypes==0.2.1
786
+ transformers==4.39.3
787
+ treelite-runtime==3.2.0
788
+ treelite==3.2.0
789
+ trl==0.8.1
790
+ truststore==0.8.0
791
+ trx-python==0.2.9
792
+ tsfresh==0.20.2
793
+ typeguard==4.1.5
794
+ typer==0.9.0
795
+ typer==0.9.4
796
+ types-python-dateutil==2.8.19.20240106
797
+ typing-inspect==0.9.0
798
+ typing-utils==0.1.0
799
+ typing_extensions==4.9.0
800
+ tyro==0.8.3
801
+ tzdata==2023.4
802
+ uc-micro-py==1.0.3
803
+ ucx-py==0.33.0
804
+ ujson==5.9.0
805
+ umap-learn==0.5.5
806
+ unicodedata2==15.1.0
807
+ update-checker==0.18.0
808
+ uri-template==1.3.0
809
+ uritemplate==3.0.1
810
+ urllib3==1.26.18
811
+ urllib3==2.1.0
812
+ urwid==2.6.10
813
+ urwid_readline==0.14
814
+ uvicorn==0.25.0
815
+ uvloop==0.19.0
816
+ vaex-astro==0.9.3
817
+ vaex-core==4.17.1
818
+ vaex-hdf5==0.14.1
819
+ vaex-jupyter==0.8.2
820
+ vaex-ml==0.18.3
821
+ vaex-server==0.9.0
822
+ vaex-viz==0.5.4
823
+ vaex==4.17.0
824
+ vec_noise==1.1.4
825
+ vecstack==0.4.0
826
+ virtualenv==20.21.0
827
+ visions==0.7.5
828
+ vowpalwabbit==9.9.0
829
+ vtk==9.3.0
830
+ wandb==0.16.5
831
+ wasabi==1.1.2
832
+ watchfiles==0.21.0
833
+ wavio==0.0.8
834
+ wcwidth==0.2.13
835
+ weasel==0.3.4
836
+ webcolors==1.13
837
+ webencodings==0.5.1
838
+ websocket-client==1.7.0
839
+ websockets==12.0
840
+ wfdb==4.1.2
841
+ whatthepatch==1.0.5
842
+ wheel==0.42.0
843
+ widgetsnbextension==3.6.6
844
+ witwidget==1.8.1
845
+ woodwork==0.29.0
846
+ wordcloud==1.9.3
847
+ wordsegment==1.3.1
848
+ wrapt==1.14.1
849
+ xarray-einstats==0.7.0
850
+ xarray==2024.3.0
851
+ xgboost==2.0.3
852
+ xvfbwrapper==0.2.9
853
+ xxhash==3.4.1
854
+ xyzservices==2023.10.1
855
+ y-py==0.6.2
856
+ yapf==0.40.2
857
+ yarl==1.9.3
858
+ yarl==1.9.4
859
+ ydata-profiling==4.6.4
860
+ yellowbrick==1.5
861
+ ypy-websocket==0.8.4
862
+ zict==3.0.0
863
+ zipp==3.17.0
864
+ zstandard==0.22.0
wandb/run-20240411_040455-4dprer7c/files/wandb-metadata.json ADDED
@@ -0,0 +1,66 @@
+ {
+ "os": "Linux-5.15.133+-x86_64-with-glibc2.31",
+ "python": "3.10.13",
+ "heartbeatAt": "2024-04-11T04:04:56.368183",
+ "startedAt": "2024-04-11T04:04:55.701503",
+ "docker": null,
+ "cuda": null,
+ "args": [],
+ "state": "running",
+ "program": "kaggle.ipynb",
+ "codePathLocal": null,
+ "root": "/kaggle/working",
+ "host": "321ddc84c049",
+ "username": "root",
+ "executable": "/opt/conda/bin/python3.10",
+ "cpu_count": 2,
+ "cpu_count_logical": 4,
+ "cpu_freq": {
+ "current": 2000.19,
+ "min": 0.0,
+ "max": 0.0
+ },
+ "cpu_freq_per_core": [
+ {
+ "current": 2000.19,
+ "min": 0.0,
+ "max": 0.0
+ },
+ {
+ "current": 2000.19,
+ "min": 0.0,
+ "max": 0.0
+ },
+ {
+ "current": 2000.19,
+ "min": 0.0,
+ "max": 0.0
+ },
+ {
+ "current": 2000.19,
+ "min": 0.0,
+ "max": 0.0
+ }
+ ],
+ "disk": {
+ "/": {
+ "total": 8062.387607574463,
+ "used": 5566.962100982666
+ }
+ },
+ "gpu": "Tesla T4",
+ "gpu_count": 2,
+ "gpu_devices": [
+ {
+ "name": "Tesla T4",
+ "memory_total": 16106127360
+ },
+ {
+ "name": "Tesla T4",
+ "memory_total": 16106127360
+ }
+ ],
+ "memory": {
+ "total": 31.357559204101562
+ }
+ }
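The metadata above records the hardware wandb probed on this Kaggle session: 2 physical / 4 logical CPUs and two 16 GB Tesla T4s. A quick illustrative check of the same numbers from inside the notebook, assuming only psutil and torch from the requirements list (this is not part of the original run):

```python
import psutil
import torch

print("physical CPUs:", psutil.cpu_count(logical=False))  # 2 in wandb-metadata.json
print("logical CPUs:", psutil.cpu_count(logical=True))    # 4
print("GPUs:", torch.cuda.device_count())                  # 2
for i in range(torch.cuda.device_count()):
    props = torch.cuda.get_device_properties(i)
    print(props.name, props.total_memory)                  # Tesla T4, 16106127360 bytes
```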
wandb/run-20240411_040455-4dprer7c/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
+ {"train/loss": 30.0974, "train/grad_norm": 258.19573974609375, "train/learning_rate": 1.111111111111111e-06, "train/epoch": 0.0, "train/global_step": 20, "_timestamp": 1712808360.9619126, "_runtime": 65.25462675094604, "_step": 0, "_wandb": {"runtime": 106}}
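wandb-summary.json keeps only the most recent value logged for each key; with logging_steps=20 in the trainer arguments (see debug.log below), the first and, in this short run, only point lands at global_step 20. A hypothetical standalone sketch of how the same keys would be written with the wandb client directly (the project name is made up; the notebook logs these through the Trainer instead):

```python
import wandb

# Hypothetical direct logging of the metric keys seen in the summary above.
run = wandb.init(project="bloomz-story-finetune", mode="offline")
run.log(
    {
        "train/loss": 30.0974,
        "train/grad_norm": 258.1957,
        "train/learning_rate": 1.111111111111111e-06,
        "train/epoch": 0.0,
    },
    step=20,
)
run.finish()  # the last logged values become the run summary
```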
wandb/run-20240411_040455-4dprer7c/logs/debug-internal.log ADDED
@@ -0,0 +1,254 @@
1
+ 2024-04-11 04:04:55,708 INFO StreamThr :781 [internal.py:wandb_internal():86] W&B internal server running at pid: 781, started at: 2024-04-11 04:04:55.707378
2
+ 2024-04-11 04:04:55,709 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status
3
+ 2024-04-11 04:04:56,097 INFO WriterThread:781 [datastore.py:open_for_write():87] open: /kaggle/working/wandb/run-20240411_040455-4dprer7c/run-4dprer7c.wandb
4
+ 2024-04-11 04:04:56,097 DEBUG SenderThread:781 [sender.py:send():379] send: header
5
+ 2024-04-11 04:04:56,100 DEBUG SenderThread:781 [sender.py:send():379] send: run
6
+ 2024-04-11 04:04:56,242 INFO SenderThread:781 [dir_watcher.py:__init__():211] watching files in: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files
7
+ 2024-04-11 04:04:56,242 INFO SenderThread:781 [sender.py:_start_run_threads():1124] run started: 4dprer7c with start time 1712808295.707286
8
+ 2024-04-11 04:04:56,250 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: check_version
9
+ 2024-04-11 04:04:56,250 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: check_version
10
+ 2024-04-11 04:04:56,338 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: run_start
11
+ 2024-04-11 04:04:56,349 DEBUG HandlerThread:781 [system_info.py:__init__():26] System info init
12
+ 2024-04-11 04:04:56,349 DEBUG HandlerThread:781 [system_info.py:__init__():41] System info init done
13
+ 2024-04-11 04:04:56,349 INFO HandlerThread:781 [system_monitor.py:start():194] Starting system monitor
14
+ 2024-04-11 04:04:56,349 INFO SystemMonitor:781 [system_monitor.py:_start():158] Starting system asset monitoring threads
15
+ 2024-04-11 04:04:56,349 INFO HandlerThread:781 [system_monitor.py:probe():214] Collecting system info
16
+ 2024-04-11 04:04:56,350 INFO SystemMonitor:781 [interfaces.py:start():190] Started cpu monitoring
17
+ 2024-04-11 04:04:56,351 INFO SystemMonitor:781 [interfaces.py:start():190] Started disk monitoring
18
+ 2024-04-11 04:04:56,352 INFO SystemMonitor:781 [interfaces.py:start():190] Started gpu monitoring
19
+ 2024-04-11 04:04:56,352 INFO SystemMonitor:781 [interfaces.py:start():190] Started memory monitoring
20
+ 2024-04-11 04:04:56,353 INFO SystemMonitor:781 [interfaces.py:start():190] Started network monitoring
21
+ 2024-04-11 04:04:56,368 DEBUG HandlerThread:781 [system_info.py:probe():150] Probing system
22
+ 2024-04-11 04:04:56,370 DEBUG HandlerThread:781 [gitlib.py:_init_repo():56] git repository is invalid
23
+ 2024-04-11 04:04:56,370 DEBUG HandlerThread:781 [system_info.py:probe():198] Probing system done
24
+ 2024-04-11 04:04:56,370 DEBUG HandlerThread:781 [system_monitor.py:probe():223] {'os': 'Linux-5.15.133+-x86_64-with-glibc2.31', 'python': '3.10.13', 'heartbeatAt': '2024-04-11T04:04:56.368183', 'startedAt': '2024-04-11T04:04:55.701503', 'docker': None, 'cuda': None, 'args': (), 'state': 'running', 'program': 'kaggle.ipynb', 'codePathLocal': None, 'root': '/kaggle/working', 'host': '321ddc84c049', 'username': 'root', 'executable': '/opt/conda/bin/python3.10', 'cpu_count': 2, 'cpu_count_logical': 4, 'cpu_freq': {'current': 2000.19, 'min': 0.0, 'max': 0.0}, 'cpu_freq_per_core': [{'current': 2000.19, 'min': 0.0, 'max': 0.0}, {'current': 2000.19, 'min': 0.0, 'max': 0.0}, {'current': 2000.19, 'min': 0.0, 'max': 0.0}, {'current': 2000.19, 'min': 0.0, 'max': 0.0}], 'disk': {'/': {'total': 8062.387607574463, 'used': 5566.962100982666}}, 'gpu': 'Tesla T4', 'gpu_count': 2, 'gpu_devices': [{'name': 'Tesla T4', 'memory_total': 16106127360}, {'name': 'Tesla T4', 'memory_total': 16106127360}], 'memory': {'total': 31.357559204101562}}
25
+ 2024-04-11 04:04:56,370 INFO HandlerThread:781 [system_monitor.py:probe():224] Finished collecting system info
26
+ 2024-04-11 04:04:56,370 INFO HandlerThread:781 [system_monitor.py:probe():227] Publishing system info
27
+ 2024-04-11 04:04:56,370 DEBUG HandlerThread:781 [system_info.py:_save_conda():207] Saving list of conda packages installed into the current environment
28
+ 2024-04-11 04:04:57,244 INFO Thread-12 :781 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/conda-environment.yaml
29
+ 2024-04-11 04:05:11,386 ERROR HandlerThread:781 [system_info.py:_save_conda():221] Error saving conda packages: Command '['conda', 'env', 'export']' timed out after 15 seconds
30
+ Traceback (most recent call last):
31
+ File "/opt/conda/lib/python3.10/site-packages/wandb/sdk/internal/system/system_info.py", line 214, in _save_conda
32
+ subprocess.call(
33
+ File "/opt/conda/lib/python3.10/subprocess.py", line 347, in call
34
+ return p.wait(timeout=timeout)
35
+ File "/opt/conda/lib/python3.10/subprocess.py", line 1209, in wait
36
+ return self._wait(timeout=timeout)
37
+ File "/opt/conda/lib/python3.10/subprocess.py", line 1951, in _wait
38
+ raise TimeoutExpired(self.args, timeout)
39
+ subprocess.TimeoutExpired: Command '['conda', 'env', 'export']' timed out after 15 seconds
40
+ 2024-04-11 04:05:11,386 DEBUG HandlerThread:781 [system_info.py:_save_conda():222] Saving conda packages done
41
+ 2024-04-11 04:05:11,387 INFO HandlerThread:781 [system_monitor.py:probe():229] Finished publishing system info
42
+ 2024-04-11 04:05:11,392 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
43
+ 2024-04-11 04:05:11,393 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: keepalive
44
+ 2024-04-11 04:05:11,393 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
45
+ 2024-04-11 04:05:11,393 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: keepalive
46
+ 2024-04-11 04:05:11,393 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
47
+ 2024-04-11 04:05:11,393 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: keepalive
48
+ 2024-04-11 04:05:11,393 DEBUG SenderThread:781 [sender.py:send():379] send: files
49
+ 2024-04-11 04:05:11,394 INFO SenderThread:781 [sender.py:_save_file():1390] saving file wandb-metadata.json with policy now
50
+ 2024-04-11 04:05:11,591 INFO wandb-upload_0:781 [upload_job.py:push():131] Uploaded file /tmp/tmp48h4betowandb/odf1mr1f-wandb-metadata.json
51
+ 2024-04-11 04:05:12,247 INFO Thread-12 :781 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/wandb-metadata.json
52
+ 2024-04-11 04:05:12,360 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: python_packages
53
+ 2024-04-11 04:05:12,360 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: python_packages
54
+ 2024-04-11 04:05:12,363 DEBUG SenderThread:781 [sender.py:send():379] send: telemetry
55
+ 2024-04-11 04:05:12,373 DEBUG SenderThread:781 [sender.py:send():379] send: config
56
+ 2024-04-11 04:05:12,375 DEBUG SenderThread:781 [sender.py:send():379] send: metric
57
+ 2024-04-11 04:05:12,376 DEBUG SenderThread:781 [sender.py:send():379] send: telemetry
58
+ 2024-04-11 04:05:12,377 DEBUG SenderThread:781 [sender.py:send():379] send: metric
59
+ 2024-04-11 04:05:12,377 WARNING SenderThread:781 [sender.py:send_metric():1341] Seen metric with glob (shouldn't happen)
60
+ 2024-04-11 04:05:12,377 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: stop_status
61
+ 2024-04-11 04:05:12,377 DEBUG SenderThread:781 [sender.py:send():379] send: telemetry
62
+ 2024-04-11 04:05:12,378 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: internal_messages
63
+ 2024-04-11 04:05:12,379 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: stop_status
64
+ 2024-04-11 04:05:13,248 INFO Thread-12 :781 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/output.log
65
+ 2024-04-11 04:05:13,248 INFO Thread-12 :781 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/requirements.txt
66
+ 2024-04-11 04:05:15,249 INFO Thread-12 :781 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/output.log
67
+ 2024-04-11 04:05:16,873 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
68
+ 2024-04-11 04:05:17,250 INFO Thread-12 :781 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/output.log
69
+ 2024-04-11 04:05:21,874 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
70
+ 2024-04-11 04:05:26,880 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
71
+ 2024-04-11 04:05:27,254 INFO Thread-12 :781 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/config.yaml
72
+ 2024-04-11 04:05:28,163 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: internal_messages
73
+ 2024-04-11 04:05:28,165 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: stop_status
74
+ 2024-04-11 04:05:28,166 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: stop_status
75
+ 2024-04-11 04:05:32,273 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
76
+ 2024-04-11 04:05:37,274 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
77
+ 2024-04-11 04:05:42,275 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
78
+ 2024-04-11 04:05:42,872 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: internal_messages
79
+ 2024-04-11 04:05:42,872 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: stop_status
80
+ 2024-04-11 04:05:42,873 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: stop_status
81
+ 2024-04-11 04:05:47,920 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
82
+ 2024-04-11 04:05:52,920 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
83
+ 2024-04-11 04:05:56,353 DEBUG SystemMonitor:781 [system_monitor.py:_start():172] Starting system metrics aggregation loop
84
+ 2024-04-11 04:05:56,355 DEBUG SenderThread:781 [sender.py:send():379] send: stats
85
+ 2024-04-11 04:05:57,869 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: stop_status
86
+ 2024-04-11 04:05:57,870 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: stop_status
87
+ 2024-04-11 04:05:57,903 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: internal_messages
88
+ 2024-04-11 04:05:58,904 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
89
+ 2024-04-11 04:06:00,962 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: partial_history
90
+ 2024-04-11 04:06:00,965 DEBUG SenderThread:781 [sender.py:send():379] send: metric
91
+ 2024-04-11 04:06:00,965 DEBUG SenderThread:781 [sender.py:send():379] send: metric
92
+ 2024-04-11 04:06:00,965 DEBUG SenderThread:781 [sender.py:send():379] send: metric
93
+ 2024-04-11 04:06:00,965 DEBUG SenderThread:781 [sender.py:send():379] send: metric
94
+ 2024-04-11 04:06:00,966 DEBUG SenderThread:781 [sender.py:send():379] send: history
95
+ 2024-04-11 04:06:00,966 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: summary_record
96
+ 2024-04-11 04:06:00,966 INFO SenderThread:781 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
97
+ 2024-04-11 04:06:01,267 INFO Thread-12 :781 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/wandb-summary.json
98
+ 2024-04-11 04:06:03,268 INFO Thread-12 :781 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/output.log
99
+ 2024-04-11 04:06:04,004 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
100
+ 2024-04-11 04:06:07,270 INFO Thread-12 :781 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/output.log
101
+ 2024-04-11 04:06:09,172 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
102
+ 2024-04-11 04:06:12,869 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: stop_status
103
+ 2024-04-11 04:06:12,870 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: stop_status
104
+ 2024-04-11 04:06:12,873 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: internal_messages
105
+ 2024-04-11 04:06:14,934 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
106
+ 2024-04-11 04:06:19,934 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
107
+ 2024-04-11 04:06:24,936 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
108
+ 2024-04-11 04:06:26,356 DEBUG SenderThread:781 [sender.py:send():379] send: stats
109
+ 2024-04-11 04:06:27,870 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: stop_status
110
+ 2024-04-11 04:06:27,870 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: stop_status
111
+ 2024-04-11 04:06:27,910 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: internal_messages
112
+ 2024-04-11 04:06:29,974 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
113
+ 2024-04-11 04:06:30,281 INFO Thread-12 :781 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/config.yaml
114
+ 2024-04-11 04:06:35,067 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
115
+ 2024-04-11 04:06:40,068 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
116
+ 2024-04-11 04:06:42,978 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: pause
117
+ 2024-04-11 04:06:42,978 INFO HandlerThread:781 [handler.py:handle_request_pause():708] stopping system metrics thread
118
+ 2024-04-11 04:06:42,978 INFO HandlerThread:781 [system_monitor.py:finish():203] Stopping system monitor
119
+ 2024-04-11 04:06:42,978 INFO HandlerThread:781 [interfaces.py:finish():202] Joined cpu monitor
120
+ 2024-04-11 04:06:42,979 INFO HandlerThread:781 [interfaces.py:finish():202] Joined disk monitor
121
+ 2024-04-11 04:06:42,979 DEBUG SystemMonitor:781 [system_monitor.py:_start():179] Finished system metrics aggregation loop
122
+ 2024-04-11 04:06:42,979 DEBUG SystemMonitor:781 [system_monitor.py:_start():183] Publishing last batch of metrics
123
+ 2024-04-11 04:06:42,990 INFO HandlerThread:781 [interfaces.py:finish():202] Joined gpu monitor
124
+ 2024-04-11 04:06:42,990 INFO HandlerThread:781 [interfaces.py:finish():202] Joined memory monitor
125
+ 2024-04-11 04:06:42,990 INFO HandlerThread:781 [interfaces.py:finish():202] Joined network monitor
126
+ 2024-04-11 04:06:42,991 DEBUG SenderThread:781 [sender.py:send():379] send: stats
127
+ 2024-04-11 04:06:43,019 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: stop_status
128
+ 2024-04-11 04:06:43,019 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: internal_messages
129
+ 2024-04-11 04:06:43,019 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: stop_status
130
+ 2024-04-11 04:06:46,066 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
131
+ 2024-04-11 04:06:49,976 DEBUG SenderThread:781 [sender.py:send():379] send: exit
132
+ 2024-04-11 04:06:49,976 INFO SenderThread:781 [sender.py:send_exit():586] handling exit code: 0
133
+ 2024-04-11 04:06:49,976 INFO SenderThread:781 [sender.py:send_exit():588] handling runtime: 106
134
+ 2024-04-11 04:06:49,977 INFO SenderThread:781 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
135
+ 2024-04-11 04:06:49,977 INFO SenderThread:781 [sender.py:send_exit():594] send defer
136
+ 2024-04-11 04:06:49,977 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
137
+ 2024-04-11 04:06:49,977 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 0
138
+ 2024-04-11 04:06:49,977 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
139
+ 2024-04-11 04:06:49,978 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 0
140
+ 2024-04-11 04:06:49,978 INFO SenderThread:781 [sender.py:transition_state():614] send defer: 1
141
+ 2024-04-11 04:06:49,978 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
142
+ 2024-04-11 04:06:49,978 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 1
143
+ 2024-04-11 04:06:49,978 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
144
+ 2024-04-11 04:06:49,978 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 1
145
+ 2024-04-11 04:06:49,978 INFO SenderThread:781 [sender.py:transition_state():614] send defer: 2
146
+ 2024-04-11 04:06:49,978 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
147
+ 2024-04-11 04:06:49,978 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 2
148
+ 2024-04-11 04:06:49,978 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
149
+ 2024-04-11 04:06:49,978 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 2
150
+ 2024-04-11 04:06:49,978 INFO SenderThread:781 [sender.py:transition_state():614] send defer: 3
151
+ 2024-04-11 04:06:49,979 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
152
+ 2024-04-11 04:06:49,979 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 3
153
+ 2024-04-11 04:06:49,979 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
154
+ 2024-04-11 04:06:49,979 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 3
155
+ 2024-04-11 04:06:49,979 INFO SenderThread:781 [sender.py:transition_state():614] send defer: 4
156
+ 2024-04-11 04:06:49,979 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
157
+ 2024-04-11 04:06:49,979 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 4
158
+ 2024-04-11 04:06:49,979 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
159
+ 2024-04-11 04:06:49,979 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 4
160
+ 2024-04-11 04:06:49,979 INFO SenderThread:781 [sender.py:transition_state():614] send defer: 5
161
+ 2024-04-11 04:06:49,979 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
162
+ 2024-04-11 04:06:49,980 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 5
163
+ 2024-04-11 04:06:49,980 DEBUG SenderThread:781 [sender.py:send():379] send: summary
164
+ 2024-04-11 04:06:49,980 INFO SenderThread:781 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
165
+ 2024-04-11 04:06:49,980 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
166
+ 2024-04-11 04:06:49,981 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 5
167
+ 2024-04-11 04:06:49,981 INFO SenderThread:781 [sender.py:transition_state():614] send defer: 6
168
+ 2024-04-11 04:06:49,981 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
169
+ 2024-04-11 04:06:49,981 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 6
170
+ 2024-04-11 04:06:49,981 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
171
+ 2024-04-11 04:06:49,981 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 6
172
+ 2024-04-11 04:06:49,981 INFO SenderThread:781 [sender.py:transition_state():614] send defer: 7
173
+ 2024-04-11 04:06:49,981 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: status_report
174
+ 2024-04-11 04:06:49,981 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
175
+ 2024-04-11 04:06:49,981 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 7
176
+ 2024-04-11 04:06:49,982 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
177
+ 2024-04-11 04:06:49,982 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 7
178
+ 2024-04-11 04:06:50,288 INFO Thread-12 :781 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/wandb-summary.json
179
+ 2024-04-11 04:06:50,499 INFO SenderThread:781 [sender.py:transition_state():614] send defer: 8
180
+ 2024-04-11 04:06:50,499 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
181
+ 2024-04-11 04:06:50,499 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 8
182
+ 2024-04-11 04:06:50,499 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
183
+ 2024-04-11 04:06:50,499 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 8
184
+ 2024-04-11 04:06:50,500 INFO SenderThread:781 [job_builder.py:build():318] Attempting to build job artifact
185
+ 2024-04-11 04:06:50,501 INFO SenderThread:781 [job_builder.py:_get_source_type():466] no source found
186
+ 2024-04-11 04:06:50,502 INFO SenderThread:781 [sender.py:transition_state():614] send defer: 9
187
+ 2024-04-11 04:06:50,502 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
188
+ 2024-04-11 04:06:50,502 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 9
189
+ 2024-04-11 04:06:50,502 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
190
+ 2024-04-11 04:06:50,502 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 9
191
+ 2024-04-11 04:06:50,502 INFO SenderThread:781 [dir_watcher.py:finish():358] shutting down directory watcher
192
+ 2024-04-11 04:06:50,976 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: poll_exit
193
+ 2024-04-11 04:06:51,289 INFO Thread-12 :781 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/output.log
194
+ 2024-04-11 04:06:51,289 INFO SenderThread:781 [dir_watcher.py:finish():388] scan: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files
195
+ 2024-04-11 04:06:51,290 INFO SenderThread:781 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/config.yaml config.yaml
196
+ 2024-04-11 04:06:51,290 INFO SenderThread:781 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/requirements.txt requirements.txt
197
+ 2024-04-11 04:06:51,294 INFO SenderThread:781 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/conda-environment.yaml conda-environment.yaml
198
+ 2024-04-11 04:06:51,298 INFO SenderThread:781 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/wandb-summary.json wandb-summary.json
199
+ 2024-04-11 04:06:51,299 INFO SenderThread:781 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/wandb-metadata.json wandb-metadata.json
200
+ 2024-04-11 04:06:51,303 INFO SenderThread:781 [dir_watcher.py:finish():402] scan save: /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/output.log output.log
201
+ 2024-04-11 04:06:51,304 INFO SenderThread:781 [sender.py:transition_state():614] send defer: 10
202
+ 2024-04-11 04:06:51,305 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: poll_exit
203
+ 2024-04-11 04:06:51,308 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
204
+ 2024-04-11 04:06:51,313 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 10
205
+ 2024-04-11 04:06:51,313 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
206
+ 2024-04-11 04:06:51,313 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 10
207
+ 2024-04-11 04:06:51,313 INFO SenderThread:781 [file_pusher.py:finish():172] shutting down file pusher
208
+ 2024-04-11 04:06:51,460 INFO wandb-upload_0:781 [upload_job.py:push():131] Uploaded file /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/config.yaml
209
+ 2024-04-11 04:06:51,532 INFO wandb-upload_1:781 [upload_job.py:push():131] Uploaded file /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/requirements.txt
210
+ 2024-04-11 04:06:51,536 INFO wandb-upload_3:781 [upload_job.py:push():131] Uploaded file /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/output.log
211
+ 2024-04-11 04:06:51,604 INFO wandb-upload_2:781 [upload_job.py:push():131] Uploaded file /kaggle/working/wandb/run-20240411_040455-4dprer7c/files/wandb-summary.json
212
+ 2024-04-11 04:06:51,804 INFO Thread-11 (_thread_body):781 [sender.py:transition_state():614] send defer: 11
213
+ 2024-04-11 04:06:51,805 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
214
+ 2024-04-11 04:06:51,805 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 11
215
+ 2024-04-11 04:06:51,805 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
216
+ 2024-04-11 04:06:51,805 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 11
217
+ 2024-04-11 04:06:51,805 INFO SenderThread:781 [file_pusher.py:join():178] waiting for file pusher
218
+ 2024-04-11 04:06:51,806 INFO SenderThread:781 [sender.py:transition_state():614] send defer: 12
219
+ 2024-04-11 04:06:51,806 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
220
+ 2024-04-11 04:06:51,806 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 12
221
+ 2024-04-11 04:06:51,806 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
222
+ 2024-04-11 04:06:51,806 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 12
223
+ 2024-04-11 04:06:51,806 INFO SenderThread:781 [file_stream.py:finish():614] file stream finish called
224
+ 2024-04-11 04:06:51,868 INFO SenderThread:781 [file_stream.py:finish():618] file stream finish is done
225
+ 2024-04-11 04:06:51,869 INFO SenderThread:781 [sender.py:transition_state():614] send defer: 13
226
+ 2024-04-11 04:06:51,869 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
227
+ 2024-04-11 04:06:51,869 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 13
228
+ 2024-04-11 04:06:51,869 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
229
+ 2024-04-11 04:06:51,869 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 13
230
+ 2024-04-11 04:06:51,869 INFO SenderThread:781 [sender.py:transition_state():614] send defer: 14
231
+ 2024-04-11 04:06:51,869 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: defer
232
+ 2024-04-11 04:06:51,869 INFO HandlerThread:781 [handler.py:handle_request_defer():172] handle defer: 14
233
+ 2024-04-11 04:06:51,870 DEBUG SenderThread:781 [sender.py:send():379] send: final
234
+ 2024-04-11 04:06:51,870 DEBUG SenderThread:781 [sender.py:send():379] send: footer
235
+ 2024-04-11 04:06:51,870 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: defer
236
+ 2024-04-11 04:06:51,870 INFO SenderThread:781 [sender.py:send_request_defer():610] handle sender defer: 14
237
+ 2024-04-11 04:06:51,871 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: poll_exit
238
+ 2024-04-11 04:06:51,872 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: poll_exit
239
+ 2024-04-11 04:06:51,872 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: poll_exit
240
+ 2024-04-11 04:06:51,873 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: poll_exit
241
+ 2024-04-11 04:06:51,873 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: server_info
242
+ 2024-04-11 04:06:51,873 DEBUG SenderThread:781 [sender.py:send_request():406] send_request: server_info
243
+ 2024-04-11 04:06:51,876 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: get_summary
244
+ 2024-04-11 04:06:51,876 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: sampled_history
245
+ 2024-04-11 04:06:51,877 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: internal_messages
246
+ 2024-04-11 04:06:51,888 INFO MainThread:781 [wandb_run.py:_footer_history_summary_info():3920] rendering history
247
+ 2024-04-11 04:06:51,888 INFO MainThread:781 [wandb_run.py:_footer_history_summary_info():3952] rendering summary
248
+ 2024-04-11 04:06:51,889 INFO MainThread:781 [wandb_run.py:_footer_sync_info():3879] logging synced files
249
+ 2024-04-11 04:06:51,889 DEBUG HandlerThread:781 [handler.py:handle_request():146] handle_request: shutdown
250
+ 2024-04-11 04:06:51,889 INFO HandlerThread:781 [handler.py:finish():866] shutting down handler
251
+ 2024-04-11 04:06:52,873 INFO WriterThread:781 [datastore.py:close():296] close: /kaggle/working/wandb/run-20240411_040455-4dprer7c/run-4dprer7c.wandb
252
+ 2024-04-11 04:06:52,888 INFO SenderThread:781 [sender.py:finish():1546] shutting down sender
253
+ 2024-04-11 04:06:52,888 INFO SenderThread:781 [file_pusher.py:finish():172] shutting down file pusher
254
+ 2024-04-11 04:06:52,888 INFO SenderThread:781 [file_pusher.py:join():178] waiting for file pusher
wandb/run-20240411_040455-4dprer7c/logs/debug.log ADDED
@@ -0,0 +1,33 @@
+ 2024-04-11 04:04:55,703 INFO MainThread:740 [wandb_setup.py:_flush():76] Current SDK version is 0.16.5
+ 2024-04-11 04:04:55,703 INFO MainThread:740 [wandb_setup.py:_flush():76] Configure stats pid to 740
+ 2024-04-11 04:04:55,703 INFO MainThread:740 [wandb_setup.py:_flush():76] Loading settings from /root/.config/wandb/settings
+ 2024-04-11 04:04:55,703 INFO MainThread:740 [wandb_setup.py:_flush():76] Loading settings from /kaggle/working/wandb/settings
+ 2024-04-11 04:04:55,703 INFO MainThread:740 [wandb_setup.py:_flush():76] Loading settings from environment variables: {}
+ 2024-04-11 04:04:55,703 INFO MainThread:740 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
+ 2024-04-11 04:04:55,703 INFO MainThread:740 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program': '<python with no main file>'}
+ 2024-04-11 04:04:55,703 INFO MainThread:740 [wandb_setup.py:_flush():76] Applying login settings: {}
+ 2024-04-11 04:04:55,703 INFO MainThread:740 [wandb_init.py:_log_setup():527] Logging user logs to /kaggle/working/wandb/run-20240411_040455-4dprer7c/logs/debug.log
+ 2024-04-11 04:04:55,703 INFO MainThread:740 [wandb_init.py:_log_setup():528] Logging internal logs to /kaggle/working/wandb/run-20240411_040455-4dprer7c/logs/debug-internal.log
+ 2024-04-11 04:04:55,703 INFO MainThread:740 [wandb_init.py:_jupyter_setup():473] configuring jupyter hooks <wandb.sdk.wandb_init._WandbInit object at 0x7805e5e25660>
+ 2024-04-11 04:04:55,704 INFO MainThread:740 [wandb_init.py:init():567] calling init triggers
+ 2024-04-11 04:04:55,704 INFO MainThread:740 [wandb_init.py:init():574] wandb.init called with sweep_config: {}
+ config: {}
+ 2024-04-11 04:04:55,704 INFO MainThread:740 [wandb_init.py:init():617] starting backend
+ 2024-04-11 04:04:55,704 INFO MainThread:740 [wandb_init.py:init():621] setting up manager
+ 2024-04-11 04:04:55,706 INFO MainThread:740 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
+ 2024-04-11 04:04:55,707 INFO MainThread:740 [wandb_init.py:init():629] backend started and connected
+ 2024-04-11 04:04:55,718 INFO MainThread:740 [wandb_run.py:_label_probe_notebook():1299] probe notebook
+ 2024-04-11 04:04:56,096 INFO MainThread:740 [wandb_init.py:init():721] updated telemetry
+ 2024-04-11 04:04:56,099 INFO MainThread:740 [wandb_init.py:init():754] communicating run to backend with 90.0 second timeout
+ 2024-04-11 04:04:56,249 INFO MainThread:740 [wandb_run.py:_on_init():2344] communicating current version
+ 2024-04-11 04:04:56,332 INFO MainThread:740 [wandb_run.py:_on_init():2353] got version response upgrade_message: "wandb version 0.16.6 is available! To upgrade, please run:\n $ pip install wandb --upgrade"
+
+ 2024-04-11 04:04:56,332 INFO MainThread:740 [wandb_init.py:init():805] starting run threads in backend
+ 2024-04-11 04:05:12,361 INFO MainThread:740 [wandb_run.py:_console_start():2323] atexit reg
+ 2024-04-11 04:05:12,361 INFO MainThread:740 [wandb_run.py:_redirect():2178] redirect: wrap_raw
+ 2024-04-11 04:05:12,362 INFO MainThread:740 [wandb_run.py:_redirect():2243] Wrapping output streams.
+ 2024-04-11 04:05:12,362 INFO MainThread:740 [wandb_run.py:_redirect():2268] Redirects installed.
+ 2024-04-11 04:05:12,363 INFO MainThread:740 [wandb_init.py:init():848] run started, returning control to user process
+ 2024-04-11 04:05:12,368 INFO MainThread:740 [wandb_run.py:_config_callback():1347] config_cb None None {'vocab_size': 250880, 'hidden_size': 1024, 'n_layer': 24, 'n_head': 16, 'layer_norm_epsilon': 1e-05, 'initializer_range': 0.02, 'use_cache': False, 'pretraining_tp': 1, 'apply_residual_connection_post_layernorm': False, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'bos_token_id': 1, 'eos_token_id': 2, 'slow_but_exact': False, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': None, 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['BloomForCausalLM'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'pad_token_id': 3, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'bigscience/bloomz-560m', 'transformers_version': '4.39.3', 'attention_softmax_in_fp32': True, 'bias_dropout_fusion': True, 'unk_token_id': 0, 'masked_softmax_fusion': True, 'model_type': 'bloom', 'n_inner': None, 'offset_alibi': 100, 'seq_length': 2048, 'skip_bias_add': True, 'skip_bias_add_qkv': False, 'quantization_config': {'quant_method': 'QuantizationMethod.BITS_AND_BYTES', '_load_in_8bit': False, '_load_in_4bit': True, 'llm_int8_threshold': 6.0, 'llm_int8_skip_modules': None, 'llm_int8_enable_fp32_cpu_offload': False, 'llm_int8_has_fp16_weight': False, 'bnb_4bit_quant_type': 'nf4', 'bnb_4bit_use_double_quant': False, 'bnb_4bit_compute_dtype': 'float16', 'bnb_4bit_quant_storage': 'uint8', 'load_in_4bit': True, 'load_in_8bit': False}, 'output_dir': '/kaggle/working/', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': False, 'do_predict': False, 'evaluation_strategy': 'no', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'learning_rate': 3e-05, 'weight_decay': 0.001, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 0.3, 'num_train_epochs': 5, 'max_steps': 18000, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/kaggle/working/runs/Apr11_04-04-49_321ddc84c049', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 20, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 1, 'save_safetensors': 
True, 'save_on_each_node': False, 'save_only_model': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': None, 'dataloader_num_workers': 8, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': '/kaggle/working/', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'paged_adamw_32bit', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['tensorboard', 'wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': True, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': True, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None}
32
+ 2024-04-11 04:06:42,977 INFO MainThread:740 [jupyter.py:save_ipynb():373] not saving jupyter notebook
33
+ 2024-04-11 04:06:42,977 INFO MainThread:740 [wandb_init.py:_pause_backend():438] pausing backend
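
Note: the config_cb dump above records the full quantization and Trainer configuration for this run. The snippet below is a minimal sketch of how that setup could be reproduced with transformers 4.39.3; it is reconstructed from the logged values, not taken from the original notebook, and the dataset wiring and the PEFT/LoRA adapter added elsewhere in this commit are omitted. The device_map choice is an assumption, since placement is not recorded in the log.

    import torch
    from transformers import (AutoModelForCausalLM, AutoTokenizer,
                              BitsAndBytesConfig, TrainingArguments)

    # 4-bit NF4 quantization, matching the logged quantization_config
    bnb_config = BitsAndBytesConfig(
        load_in_4bit=True,
        bnb_4bit_quant_type="nf4",
        bnb_4bit_compute_dtype=torch.float16,
        bnb_4bit_use_double_quant=False,
    )

    model = AutoModelForCausalLM.from_pretrained(
        "bigscience/bloomz-560m",
        quantization_config=bnb_config,
        device_map="auto",  # assumption: device placement is not recorded in the log
    )
    tokenizer = AutoTokenizer.from_pretrained("bigscience/bloomz-560m")

    # Trainer settings copied from the config_cb dump for run 4dprer7c
    args = TrainingArguments(
        output_dir="/kaggle/working/",
        per_device_train_batch_size=8,
        learning_rate=3e-5,
        weight_decay=0.001,
        max_grad_norm=0.3,
        num_train_epochs=5,
        max_steps=18000,
        lr_scheduler_type="cosine",
        warmup_ratio=0.03,
        logging_steps=20,
        save_steps=20,
        save_total_limit=1,
        optim="paged_adamw_32bit",
        gradient_checkpointing=True,
        dataloader_num_workers=8,
        auto_find_batch_size=True,
        report_to=["tensorboard", "wandb"],
    )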
wandb/run-20240411_040455-4dprer7c/run-4dprer7c.wandb ADDED
Binary file (13 kB). View file
 
wandb/run-20240411_040722-rimyh9a1/files/conda-environment.yaml ADDED
File without changes
wandb/run-20240411_040722-rimyh9a1/files/config.yaml ADDED
@@ -0,0 +1,702 @@
1
+ wandb_version: 1
2
+
3
+ _wandb:
4
+ desc: null
5
+ value:
6
+ python_version: 3.10.13
7
+ cli_version: 0.16.5
8
+ framework: huggingface
9
+ huggingface_version: 4.39.3
10
+ is_jupyter_run: true
11
+ is_kaggle_kernel: true
12
+ start_time: 1712808442.0
13
+ t:
14
+ 1:
15
+ - 1
16
+ - 2
17
+ - 3
18
+ - 5
19
+ - 11
20
+ - 12
21
+ - 49
22
+ - 51
23
+ - 53
24
+ - 55
25
+ - 71
26
+ - 84
27
+ - 98
28
+ - 105
29
+ 2:
30
+ - 1
31
+ - 2
32
+ - 3
33
+ - 5
34
+ - 11
35
+ - 12
36
+ - 49
37
+ - 51
38
+ - 53
39
+ - 55
40
+ - 71
41
+ - 84
42
+ - 98
43
+ - 105
44
+ 3:
45
+ - 7
46
+ - 23
47
+ - 62
48
+ 4: 3.10.13
49
+ 5: 0.16.5
50
+ 6: 4.39.3
51
+ 8:
52
+ - 1
53
+ - 2
54
+ - 5
55
+ 9:
56
+ 1: transformers_trainer
57
+ 13: linux-x86_64
58
+ m:
59
+ - 1: train/global_step
60
+ 6:
61
+ - 3
62
+ - 1: train/loss
63
+ 5: 1
64
+ 6:
65
+ - 1
66
+ - 1: train/grad_norm
67
+ 5: 1
68
+ 6:
69
+ - 1
70
+ - 1: train/learning_rate
71
+ 5: 1
72
+ 6:
73
+ - 1
74
+ - 1: train/epoch
75
+ 5: 1
76
+ 6:
77
+ - 1
78
+ vocab_size:
79
+ desc: null
80
+ value: 250880
81
+ hidden_size:
82
+ desc: null
83
+ value: 1024
84
+ n_layer:
85
+ desc: null
86
+ value: 24
87
+ n_head:
88
+ desc: null
89
+ value: 16
90
+ layer_norm_epsilon:
91
+ desc: null
92
+ value: 1.0e-05
93
+ initializer_range:
94
+ desc: null
95
+ value: 0.02
96
+ use_cache:
97
+ desc: null
98
+ value: false
99
+ pretraining_tp:
100
+ desc: null
101
+ value: 1
102
+ apply_residual_connection_post_layernorm:
103
+ desc: null
104
+ value: false
105
+ hidden_dropout:
106
+ desc: null
107
+ value: 0.0
108
+ attention_dropout:
109
+ desc: null
110
+ value: 0.0
111
+ bos_token_id:
112
+ desc: null
113
+ value: 1
114
+ eos_token_id:
115
+ desc: null
116
+ value: 2
117
+ slow_but_exact:
118
+ desc: null
119
+ value: false
120
+ return_dict:
121
+ desc: null
122
+ value: true
123
+ output_hidden_states:
124
+ desc: null
125
+ value: false
126
+ output_attentions:
127
+ desc: null
128
+ value: false
129
+ torchscript:
130
+ desc: null
131
+ value: false
132
+ torch_dtype:
133
+ desc: null
134
+ value: null
135
+ use_bfloat16:
136
+ desc: null
137
+ value: false
138
+ tf_legacy_loss:
139
+ desc: null
140
+ value: false
141
+ pruned_heads:
142
+ desc: null
143
+ value: {}
144
+ tie_word_embeddings:
145
+ desc: null
146
+ value: true
147
+ chunk_size_feed_forward:
148
+ desc: null
149
+ value: 0
150
+ is_encoder_decoder:
151
+ desc: null
152
+ value: false
153
+ is_decoder:
154
+ desc: null
155
+ value: false
156
+ cross_attention_hidden_size:
157
+ desc: null
158
+ value: null
159
+ add_cross_attention:
160
+ desc: null
161
+ value: false
162
+ tie_encoder_decoder:
163
+ desc: null
164
+ value: false
165
+ max_length:
166
+ desc: null
167
+ value: 20
168
+ min_length:
169
+ desc: null
170
+ value: 0
171
+ do_sample:
172
+ desc: null
173
+ value: false
174
+ early_stopping:
175
+ desc: null
176
+ value: false
177
+ num_beams:
178
+ desc: null
179
+ value: 1
180
+ num_beam_groups:
181
+ desc: null
182
+ value: 1
183
+ diversity_penalty:
184
+ desc: null
185
+ value: 0.0
186
+ temperature:
187
+ desc: null
188
+ value: 1.0
189
+ top_k:
190
+ desc: null
191
+ value: 50
192
+ top_p:
193
+ desc: null
194
+ value: 1.0
195
+ typical_p:
196
+ desc: null
197
+ value: 1.0
198
+ repetition_penalty:
199
+ desc: null
200
+ value: 1.0
201
+ length_penalty:
202
+ desc: null
203
+ value: 1.0
204
+ no_repeat_ngram_size:
205
+ desc: null
206
+ value: 0
207
+ encoder_no_repeat_ngram_size:
208
+ desc: null
209
+ value: 0
210
+ bad_words_ids:
211
+ desc: null
212
+ value: null
213
+ num_return_sequences:
214
+ desc: null
215
+ value: 1
216
+ output_scores:
217
+ desc: null
218
+ value: false
219
+ return_dict_in_generate:
220
+ desc: null
221
+ value: false
222
+ forced_bos_token_id:
223
+ desc: null
224
+ value: null
225
+ forced_eos_token_id:
226
+ desc: null
227
+ value: null
228
+ remove_invalid_values:
229
+ desc: null
230
+ value: false
231
+ exponential_decay_length_penalty:
232
+ desc: null
233
+ value: null
234
+ suppress_tokens:
235
+ desc: null
236
+ value: null
237
+ begin_suppress_tokens:
238
+ desc: null
239
+ value: null
240
+ architectures:
241
+ desc: null
242
+ value:
243
+ - BloomForCausalLM
244
+ finetuning_task:
245
+ desc: null
246
+ value: null
247
+ id2label:
248
+ desc: null
249
+ value:
250
+ '0': LABEL_0
251
+ '1': LABEL_1
252
+ label2id:
253
+ desc: null
254
+ value:
255
+ LABEL_0: 0
256
+ LABEL_1: 1
257
+ tokenizer_class:
258
+ desc: null
259
+ value: null
260
+ prefix:
261
+ desc: null
262
+ value: null
263
+ pad_token_id:
264
+ desc: null
265
+ value: 3
266
+ sep_token_id:
267
+ desc: null
268
+ value: null
269
+ decoder_start_token_id:
270
+ desc: null
271
+ value: null
272
+ task_specific_params:
273
+ desc: null
274
+ value: null
275
+ problem_type:
276
+ desc: null
277
+ value: null
278
+ _name_or_path:
279
+ desc: null
280
+ value: bigscience/bloomz-560m
281
+ transformers_version:
282
+ desc: null
283
+ value: 4.39.3
284
+ attention_softmax_in_fp32:
285
+ desc: null
286
+ value: true
287
+ bias_dropout_fusion:
288
+ desc: null
289
+ value: true
290
+ unk_token_id:
291
+ desc: null
292
+ value: 0
293
+ masked_softmax_fusion:
294
+ desc: null
295
+ value: true
296
+ model_type:
297
+ desc: null
298
+ value: bloom
299
+ n_inner:
300
+ desc: null
301
+ value: null
302
+ offset_alibi:
303
+ desc: null
304
+ value: 100
305
+ seq_length:
306
+ desc: null
307
+ value: 2048
308
+ skip_bias_add:
309
+ desc: null
310
+ value: true
311
+ skip_bias_add_qkv:
312
+ desc: null
313
+ value: false
314
+ quantization_config:
315
+ desc: null
316
+ value:
317
+ quant_method: QuantizationMethod.BITS_AND_BYTES
318
+ _load_in_8bit: false
319
+ _load_in_4bit: true
320
+ llm_int8_threshold: 6.0
321
+ llm_int8_skip_modules: null
322
+ llm_int8_enable_fp32_cpu_offload: false
323
+ llm_int8_has_fp16_weight: false
324
+ bnb_4bit_quant_type: nf4
325
+ bnb_4bit_use_double_quant: false
326
+ bnb_4bit_compute_dtype: float16
327
+ bnb_4bit_quant_storage: uint8
328
+ load_in_4bit: true
329
+ load_in_8bit: false
330
+ output_dir:
331
+ desc: null
332
+ value: /kaggle/working/
333
+ overwrite_output_dir:
334
+ desc: null
335
+ value: false
336
+ do_train:
337
+ desc: null
338
+ value: false
339
+ do_eval:
340
+ desc: null
341
+ value: false
342
+ do_predict:
343
+ desc: null
344
+ value: false
345
+ evaluation_strategy:
346
+ desc: null
347
+ value: 'no'
348
+ prediction_loss_only:
349
+ desc: null
350
+ value: false
351
+ per_device_train_batch_size:
352
+ desc: null
353
+ value: 8
354
+ per_device_eval_batch_size:
355
+ desc: null
356
+ value: 8
357
+ per_gpu_train_batch_size:
358
+ desc: null
359
+ value: null
360
+ per_gpu_eval_batch_size:
361
+ desc: null
362
+ value: null
363
+ gradient_accumulation_steps:
364
+ desc: null
365
+ value: 1
366
+ eval_accumulation_steps:
367
+ desc: null
368
+ value: null
369
+ eval_delay:
370
+ desc: null
371
+ value: 0
372
+ learning_rate:
373
+ desc: null
374
+ value: 3.0e-05
375
+ weight_decay:
376
+ desc: null
377
+ value: 0.001
378
+ adam_beta1:
379
+ desc: null
380
+ value: 0.9
381
+ adam_beta2:
382
+ desc: null
383
+ value: 0.999
384
+ adam_epsilon:
385
+ desc: null
386
+ value: 1.0e-08
387
+ max_grad_norm:
388
+ desc: null
389
+ value: 0.3
390
+ num_train_epochs:
391
+ desc: null
392
+ value: 5
393
+ max_steps:
394
+ desc: null
395
+ value: 20000
396
+ lr_scheduler_type:
397
+ desc: null
398
+ value: cosine
399
+ lr_scheduler_kwargs:
400
+ desc: null
401
+ value: {}
402
+ warmup_ratio:
403
+ desc: null
404
+ value: 0.03
405
+ warmup_steps:
406
+ desc: null
407
+ value: 0
408
+ log_level:
409
+ desc: null
410
+ value: passive
411
+ log_level_replica:
412
+ desc: null
413
+ value: warning
414
+ log_on_each_node:
415
+ desc: null
416
+ value: true
417
+ logging_dir:
418
+ desc: null
419
+ value: /kaggle/working/runs/Apr11_04-07-17_321ddc84c049
420
+ logging_strategy:
421
+ desc: null
422
+ value: steps
423
+ logging_first_step:
424
+ desc: null
425
+ value: false
426
+ logging_steps:
427
+ desc: null
428
+ value: 20
429
+ logging_nan_inf_filter:
430
+ desc: null
431
+ value: true
432
+ save_strategy:
433
+ desc: null
434
+ value: steps
435
+ save_steps:
436
+ desc: null
437
+ value: 20
438
+ save_total_limit:
439
+ desc: null
440
+ value: 1
441
+ save_safetensors:
442
+ desc: null
443
+ value: true
444
+ save_on_each_node:
445
+ desc: null
446
+ value: false
447
+ save_only_model:
448
+ desc: null
449
+ value: false
450
+ no_cuda:
451
+ desc: null
452
+ value: false
453
+ use_cpu:
454
+ desc: null
455
+ value: false
456
+ use_mps_device:
457
+ desc: null
458
+ value: false
459
+ seed:
460
+ desc: null
461
+ value: 42
462
+ data_seed:
463
+ desc: null
464
+ value: null
465
+ jit_mode_eval:
466
+ desc: null
467
+ value: false
468
+ use_ipex:
469
+ desc: null
470
+ value: false
471
+ bf16:
472
+ desc: null
473
+ value: false
474
+ fp16:
475
+ desc: null
476
+ value: false
477
+ fp16_opt_level:
478
+ desc: null
479
+ value: O1
480
+ half_precision_backend:
481
+ desc: null
482
+ value: auto
483
+ bf16_full_eval:
484
+ desc: null
485
+ value: false
486
+ fp16_full_eval:
487
+ desc: null
488
+ value: false
489
+ tf32:
490
+ desc: null
491
+ value: null
492
+ local_rank:
493
+ desc: null
494
+ value: 0
495
+ ddp_backend:
496
+ desc: null
497
+ value: null
498
+ tpu_num_cores:
499
+ desc: null
500
+ value: null
501
+ tpu_metrics_debug:
502
+ desc: null
503
+ value: false
504
+ debug:
505
+ desc: null
506
+ value: []
507
+ dataloader_drop_last:
508
+ desc: null
509
+ value: false
510
+ eval_steps:
511
+ desc: null
512
+ value: null
513
+ dataloader_num_workers:
514
+ desc: null
515
+ value: 8
516
+ dataloader_prefetch_factor:
517
+ desc: null
518
+ value: null
519
+ past_index:
520
+ desc: null
521
+ value: -1
522
+ run_name:
523
+ desc: null
524
+ value: /kaggle/working/
525
+ disable_tqdm:
526
+ desc: null
527
+ value: false
528
+ remove_unused_columns:
529
+ desc: null
530
+ value: true
531
+ label_names:
532
+ desc: null
533
+ value: null
534
+ load_best_model_at_end:
535
+ desc: null
536
+ value: false
537
+ metric_for_best_model:
538
+ desc: null
539
+ value: null
540
+ greater_is_better:
541
+ desc: null
542
+ value: null
543
+ ignore_data_skip:
544
+ desc: null
545
+ value: false
546
+ fsdp:
547
+ desc: null
548
+ value: []
549
+ fsdp_min_num_params:
550
+ desc: null
551
+ value: 0
552
+ fsdp_config:
553
+ desc: null
554
+ value:
555
+ min_num_params: 0
556
+ xla: false
557
+ xla_fsdp_v2: false
558
+ xla_fsdp_grad_ckpt: false
559
+ fsdp_transformer_layer_cls_to_wrap:
560
+ desc: null
561
+ value: null
562
+ accelerator_config:
563
+ desc: null
564
+ value:
565
+ split_batches: false
566
+ dispatch_batches: null
567
+ even_batches: true
568
+ use_seedable_sampler: true
569
+ deepspeed:
570
+ desc: null
571
+ value: null
572
+ label_smoothing_factor:
573
+ desc: null
574
+ value: 0.0
575
+ optim:
576
+ desc: null
577
+ value: paged_adamw_32bit
578
+ optim_args:
579
+ desc: null
580
+ value: null
581
+ adafactor:
582
+ desc: null
583
+ value: false
584
+ group_by_length:
585
+ desc: null
586
+ value: false
587
+ length_column_name:
588
+ desc: null
589
+ value: length
590
+ report_to:
591
+ desc: null
592
+ value:
593
+ - tensorboard
594
+ - wandb
595
+ ddp_find_unused_parameters:
596
+ desc: null
597
+ value: null
598
+ ddp_bucket_cap_mb:
599
+ desc: null
600
+ value: null
601
+ ddp_broadcast_buffers:
602
+ desc: null
603
+ value: null
604
+ dataloader_pin_memory:
605
+ desc: null
606
+ value: true
607
+ dataloader_persistent_workers:
608
+ desc: null
609
+ value: false
610
+ skip_memory_metrics:
611
+ desc: null
612
+ value: true
613
+ use_legacy_prediction_loop:
614
+ desc: null
615
+ value: false
616
+ push_to_hub:
617
+ desc: null
618
+ value: false
619
+ resume_from_checkpoint:
620
+ desc: null
621
+ value: null
622
+ hub_model_id:
623
+ desc: null
624
+ value: null
625
+ hub_strategy:
626
+ desc: null
627
+ value: every_save
628
+ hub_token:
629
+ desc: null
630
+ value: <HUB_TOKEN>
631
+ hub_private_repo:
632
+ desc: null
633
+ value: false
634
+ hub_always_push:
635
+ desc: null
636
+ value: false
637
+ gradient_checkpointing:
638
+ desc: null
639
+ value: true
640
+ gradient_checkpointing_kwargs:
641
+ desc: null
642
+ value: null
643
+ include_inputs_for_metrics:
644
+ desc: null
645
+ value: false
646
+ fp16_backend:
647
+ desc: null
648
+ value: auto
649
+ push_to_hub_model_id:
650
+ desc: null
651
+ value: null
652
+ push_to_hub_organization:
653
+ desc: null
654
+ value: null
655
+ push_to_hub_token:
656
+ desc: null
657
+ value: <PUSH_TO_HUB_TOKEN>
658
+ mp_parameters:
659
+ desc: null
660
+ value: ''
661
+ auto_find_batch_size:
662
+ desc: null
663
+ value: true
664
+ full_determinism:
665
+ desc: null
666
+ value: false
667
+ torchdynamo:
668
+ desc: null
669
+ value: null
670
+ ray_scope:
671
+ desc: null
672
+ value: last
673
+ ddp_timeout:
674
+ desc: null
675
+ value: 1800
676
+ torch_compile:
677
+ desc: null
678
+ value: false
679
+ torch_compile_backend:
680
+ desc: null
681
+ value: null
682
+ torch_compile_mode:
683
+ desc: null
684
+ value: null
685
+ dispatch_batches:
686
+ desc: null
687
+ value: null
688
+ split_batches:
689
+ desc: null
690
+ value: null
691
+ include_tokens_per_second:
692
+ desc: null
693
+ value: false
694
+ include_num_input_tokens_seen:
695
+ desc: null
696
+ value: false
697
+ neftune_noise_alpha:
698
+ desc: null
699
+ value: null
700
+ optim_target_modules:
701
+ desc: null
702
+ value: null
wandb/run-20240411_040722-rimyh9a1/files/output.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20240411_040722-rimyh9a1/files/requirements.txt ADDED
@@ -0,0 +1,864 @@
1
+ Babel==2.14.0
2
+ Boruta==0.3
3
+ Brotli==1.0.9
4
+ CVXcanon==0.1.2
5
+ Cartopy==0.22.0
6
+ Cython==3.0.8
7
+ Deprecated==1.2.14
8
+ Farama-Notifications==0.0.4
9
+ Flask==3.0.2
10
+ Geohash==1.0
11
+ GitPython==3.1.41
12
+ ImageHash==4.3.1
13
+ Janome==0.5.0
14
+ Jinja2==3.1.2
15
+ LunarCalendar==0.0.9
16
+ Mako==1.3.2
17
+ Markdown==3.5.2
18
+ MarkupSafe==2.1.3
19
+ MarkupSafe==2.1.5
20
+ Pillow==9.5.0
21
+ PuLP==2.8.0
22
+ PyArabic==0.6.15
23
+ PyJWT==2.8.0
24
+ PyMeeus==0.5.12
25
+ PySocks==1.7.1
26
+ PyUpSet==0.1.1.post7
27
+ PyWavelets==1.5.0
28
+ PyYAML==6.0.1
29
+ Pygments==2.17.2
30
+ Pympler==1.0.1
31
+ QtPy==2.4.1
32
+ Rtree==1.2.0
33
+ SQLAlchemy==2.0.25
34
+ SecretStorage==3.3.3
35
+ Send2Trash==1.8.2
36
+ Shapely==1.8.5.post1
37
+ Shimmy==1.3.0
38
+ SimpleITK==2.3.1
39
+ TPOT==0.12.1
40
+ Theano-PyMC==1.1.2
41
+ Theano==1.0.5
42
+ Wand==0.6.13
43
+ Werkzeug==3.0.2
44
+ absl-py==1.4.0
45
+ accelerate==0.28.0
46
+ access==1.1.9
47
+ affine==2.4.0
48
+ aiobotocore==2.12.2
49
+ aiofiles==22.1.0
50
+ aiohttp-cors==0.7.0
51
+ aiohttp==3.9.1
52
+ aioitertools==0.11.0
53
+ aiorwlock==1.3.0
54
+ aiosignal==1.3.1
55
+ aiosqlite==0.19.0
56
+ albumentations==1.4.0
57
+ alembic==1.13.1
58
+ altair==5.3.0
59
+ annotated-types==0.6.0
60
+ annoy==1.17.3
61
+ anyio==4.2.0
62
+ apache-beam==2.46.0
63
+ aplus==0.11.0
64
+ appdirs==1.4.4
65
+ archspec==0.2.3
66
+ argon2-cffi-bindings==21.2.0
67
+ argon2-cffi==23.1.0
68
+ array-record==0.5.0
69
+ arrow==1.3.0
70
+ arviz==0.17.1
71
+ astroid==3.1.0
72
+ astropy-iers-data==0.2024.4.1.0.33.14
73
+ astropy==6.0.1
74
+ asttokens==2.4.1
75
+ astunparse==1.6.3
76
+ async-lru==2.0.4
77
+ async-timeout==4.0.3
78
+ attrs==23.2.0
79
+ audioread==3.0.1
80
+ autopep8==2.0.4
81
+ backoff==2.2.1
82
+ bayesian-optimization==1.4.3
83
+ beatrix_jupyterlab==2023.128.151533
84
+ beautifulsoup4==4.12.2
85
+ bitsandbytes==0.43.0
86
+ blake3==0.2.1
87
+ bleach==6.1.0
88
+ blessed==1.20.0
89
+ blinker==1.7.0
90
+ blis==0.7.10
91
+ blosc2==2.6.0
92
+ bokeh==3.3.4
93
+ boltons==23.1.1
94
+ boto3==1.26.100
95
+ botocore==1.34.51
96
+ bq_helper==0.4.1
97
+ bqplot==0.12.43
98
+ branca==0.7.1
99
+ brewer2mpl==1.4.1
100
+ brotlipy==0.7.0
101
+ cached-property==1.5.2
102
+ cachetools==4.2.4
103
+ cachetools==5.3.2
104
+ catalogue==2.0.10
105
+ catalyst==22.4
106
+ catboost==1.2.3
107
+ category-encoders==2.6.3
108
+ certifi==2024.2.2
109
+ cesium==0.12.1
110
+ cffi==1.16.0
111
+ charset-normalizer==3.3.2
112
+ chex==0.1.86
113
+ cleverhans==4.0.0
114
+ click-plugins==1.1.1
115
+ click==8.1.7
116
+ cligj==0.7.2
117
+ cloud-tpu-client==0.10
118
+ cloud-tpu-profiler==2.4.0
119
+ cloudpathlib==0.16.0
120
+ cloudpickle==2.2.1
121
+ cloudpickle==3.0.0
122
+ cmdstanpy==1.2.2
123
+ colorama==0.4.6
124
+ colorcet==3.1.0
125
+ colorful==0.5.6
126
+ colorlog==6.8.2
127
+ colorlover==0.3.0
128
+ comm==0.2.1
129
+ conda-libmamba-solver==23.7.0
130
+ conda-package-handling==2.2.0
131
+ conda==23.7.4
132
+ conda_package_streaming==0.9.0
133
+ confection==0.1.4
134
+ contextily==1.6.0
135
+ contourpy==1.2.0
136
+ convertdate==2.4.0
137
+ crcmod==1.7
138
+ cryptography==41.0.7
139
+ cuda-python==12.4.0
140
+ cudf==23.8.0
141
+ cufflinks==0.17.3
142
+ cuml==23.8.0
143
+ cupy==13.0.0
144
+ cycler==0.12.1
145
+ cymem==2.0.8
146
+ cytoolz==0.12.3
147
+ daal4py==2024.2.0
148
+ daal==2024.2.0
149
+ dacite==1.8.1
150
+ dask-cuda==23.8.0
151
+ dask-cudf==23.8.0
152
+ dask-expr==1.0.9
153
+ dask==2024.4.0
154
+ dataclasses-json==0.6.4
155
+ dataproc_jupyter_plugin==0.1.66
156
+ datasets==2.16.0
157
+ datashader==0.16.0
158
+ datatile==1.0.3
159
+ db-dtypes==1.2.0
160
+ deap==1.4.1
161
+ debugpy==1.8.0
162
+ decorator==5.1.1
163
+ deepdiff==6.7.1
164
+ defusedxml==0.7.1
165
+ deprecation==2.1.0
166
+ descartes==1.1.0
167
+ dill==0.3.7
168
+ dipy==1.9.0
169
+ distlib==0.3.8
170
+ distributed==2023.7.1
171
+ distro==1.9.0
172
+ dm-tree==0.1.8
173
+ docker-pycreds==0.4.0
174
+ docker==7.0.0
175
+ docopt==0.6.2
176
+ docstring-parser==0.15
177
+ docstring-to-markdown==0.15
178
+ docutils==0.20.1
179
+ earthengine-api==0.1.395
180
+ easydict==1.13
181
+ easyocr==1.7.1
182
+ ecos==2.0.13
183
+ eli5==0.13.0
184
+ emoji==2.11.0
185
+ en-core-web-lg==3.7.1
186
+ en-core-web-sm==3.7.1
187
+ entrypoints==0.4
188
+ ephem==4.1.5
189
+ esda==2.5.1
190
+ essentia==2.1b6.dev1110
191
+ et-xmlfile==1.1.0
192
+ etils==1.6.0
193
+ exceptiongroup==1.2.0
194
+ executing==2.0.1
195
+ explainable-ai-sdk==1.3.3
196
+ fastai==2.7.14
197
+ fastapi==0.108.0
198
+ fastavro==1.9.3
199
+ fastcore==1.5.29
200
+ fastdownload==0.0.7
201
+ fasteners==0.19
202
+ fastjsonschema==2.19.1
203
+ fastprogress==1.0.3
204
+ fastrlock==0.8.2
205
+ fasttext==0.9.2
206
+ feather-format==0.4.1
207
+ featuretools==1.30.0
208
+ filelock==3.13.1
209
+ fiona==1.9.6
210
+ fitter==1.7.0
211
+ flake8==7.0.0
212
+ flashtext==2.7
213
+ flatbuffers==23.5.26
214
+ flax==0.8.2
215
+ folium==0.16.0
216
+ fonttools==4.47.0
217
+ fonttools==4.50.0
218
+ fqdn==1.5.1
219
+ frozendict==2.4.1
220
+ frozenlist==1.4.1
221
+ fsspec==2023.10.0
222
+ fsspec==2024.3.1
223
+ funcy==2.0
224
+ fury==0.10.0
225
+ future==1.0.0
226
+ fuzzywuzzy==0.18.0
227
+ gast==0.5.4
228
+ gatspy==0.3
229
+ gcsfs==2024.2.0
230
+ gensim==4.3.2
231
+ geographiclib==2.0
232
+ geojson==3.1.0
233
+ geopandas==0.14.3
234
+ geoplot==0.5.1
235
+ geopy==2.4.1
236
+ geoviews==1.11.1
237
+ ggplot==0.11.5
238
+ giddy==2.3.5
239
+ gitdb==4.0.11
240
+ google-ai-generativelanguage==0.4.0
241
+ google-api-core==2.11.1
242
+ google-api-core==2.18.0
243
+ google-api-python-client==2.125.0
244
+ google-apitools==0.5.31
245
+ google-auth-httplib2==0.2.0
246
+ google-auth-oauthlib==1.2.0
247
+ google-auth==2.26.1
248
+ google-cloud-aiplatform==0.6.0a1
249
+ google-cloud-artifact-registry==1.10.0
250
+ google-cloud-automl==1.0.1
251
+ google-cloud-bigquery==2.34.4
252
+ google-cloud-bigtable==1.7.3
253
+ google-cloud-core==2.4.1
254
+ google-cloud-datastore==2.19.0
255
+ google-cloud-dlp==3.14.0
256
+ google-cloud-jupyter-config==0.0.5
257
+ google-cloud-language==2.13.3
258
+ google-cloud-monitoring==2.18.0
259
+ google-cloud-pubsub==2.19.0
260
+ google-cloud-pubsublite==1.9.0
261
+ google-cloud-recommendations-ai==0.7.1
262
+ google-cloud-resource-manager==1.11.0
263
+ google-cloud-spanner==3.40.1
264
+ google-cloud-storage==1.44.0
265
+ google-cloud-translate==3.12.1
266
+ google-cloud-videointelligence==2.13.3
267
+ google-cloud-vision==2.8.0
268
+ google-crc32c==1.5.0
269
+ google-generativeai==0.4.1
270
+ google-pasta==0.2.0
271
+ google-resumable-media==2.7.0
272
+ googleapis-common-protos==1.62.0
273
+ gplearn==0.4.2
274
+ gpustat==1.0.0
275
+ gpxpy==1.6.2
276
+ graphviz==0.20.3
277
+ greenlet==3.0.3
278
+ grpc-google-iam-v1==0.12.7
279
+ grpcio-status==1.48.1
280
+ grpcio-status==1.48.2
281
+ grpcio==1.51.1
282
+ grpcio==1.60.0
283
+ gviz-api==1.10.0
284
+ gym-notices==0.0.8
285
+ gym==0.26.2
286
+ gymnasium==0.29.0
287
+ h11==0.14.0
288
+ h2o==3.46.0.1
289
+ h5netcdf==1.3.0
290
+ h5py==3.10.0
291
+ haversine==2.8.1
292
+ hdfs==2.7.3
293
+ hep-ml==0.7.2
294
+ hijri-converter==2.3.1
295
+ hmmlearn==0.3.2
296
+ holidays==0.24
297
+ holoviews==1.18.3
298
+ hpsklearn==0.1.0
299
+ html5lib==1.1
300
+ htmlmin==0.1.12
301
+ httpcore==1.0.5
302
+ httplib2==0.21.0
303
+ httptools==0.6.1
304
+ httpx==0.27.0
305
+ huggingface-hub==0.22.2
306
+ hunspell==0.5.5
307
+ hydra-slayer==0.5.0
308
+ hyperopt==0.2.7
309
+ hypertools==0.8.0
310
+ idna==3.6
311
+ igraph==0.11.4
312
+ imagecodecs==2024.1.1
313
+ imageio==2.33.1
314
+ imbalanced-learn==0.12.2
315
+ imgaug==0.4.0
316
+ importlib-metadata==6.11.0
317
+ importlib-metadata==7.0.1
318
+ importlib-resources==6.1.1
319
+ inequality==1.0.1
320
+ iniconfig==2.0.0
321
+ ipydatawidgets==4.3.5
322
+ ipykernel==6.28.0
323
+ ipyleaflet==0.18.2
324
+ ipympl==0.7.0
325
+ ipython-genutils==0.2.0
326
+ ipython-genutils==0.2.0
327
+ ipython-sql==0.5.0
328
+ ipython==8.20.0
329
+ ipyvolume==0.6.3
330
+ ipyvue==1.10.2
331
+ ipyvuetify==1.9.3
332
+ ipywebrtc==0.6.0
333
+ ipywidgets==7.7.1
334
+ isoduration==20.11.0
335
+ isort==5.13.2
336
+ isoweek==1.3.3
337
+ itsdangerous==2.1.2
338
+ jaraco.classes==3.3.0
339
+ jax-jumpy==1.0.0
340
+ jax==0.4.23
341
+ jaxlib==0.4.23.dev20240116
342
+ jedi==0.19.1
343
+ jeepney==0.8.0
344
+ jieba==0.42.1
345
+ jmespath==1.0.1
346
+ joblib==1.3.2
347
+ json5==0.9.14
348
+ jsonpatch==1.33
349
+ jsonpointer==2.4
350
+ jsonschema-specifications==2023.12.1
351
+ jsonschema==4.20.0
352
+ jupyter-console==6.6.3
353
+ jupyter-events==0.9.0
354
+ jupyter-http-over-ws==0.0.8
355
+ jupyter-lsp==1.5.1
356
+ jupyter-server-mathjax==0.2.6
357
+ jupyter-ydoc==0.2.5
358
+ jupyter_client==7.4.9
359
+ jupyter_client==8.6.0
360
+ jupyter_core==5.7.1
361
+ jupyter_server==2.13.0
362
+ jupyter_server_fileid==0.9.1
363
+ jupyter_server_proxy==4.1.0
364
+ jupyter_server_terminals==0.5.1
365
+ jupyter_server_ydoc==0.8.0
366
+ jupyterlab-lsp==5.1.0
367
+ jupyterlab-widgets==3.0.9
368
+ jupyterlab==4.1.5
369
+ jupyterlab_git==0.44.0
370
+ jupyterlab_pygments==0.3.0
371
+ jupyterlab_server==2.25.2
372
+ jupytext==1.16.0
373
+ kaggle-environments==1.14.3
374
+ kaggle==1.6.8
375
+ kagglehub==0.2.2
376
+ keras-cv==0.8.2
377
+ keras-nlp==0.8.2
378
+ keras-tuner==1.4.6
379
+ keras==3.1.1
380
+ kernels-mixer==0.0.7
381
+ keyring==24.3.0
382
+ keyrings.google-artifactregistry-auth==1.1.2
383
+ kfp-pipeline-spec==0.2.2
384
+ kfp-server-api==2.0.5
385
+ kfp==2.5.0
386
+ kiwisolver==1.4.5
387
+ kmapper==2.0.1
388
+ kmodes==0.12.2
389
+ korean-lunar-calendar==0.3.1
390
+ kornia==0.7.2
391
+ kornia_rs==0.1.3
392
+ kt-legacy==1.0.5
393
+ kubernetes==26.1.0
394
+ langcodes==3.3.0
395
+ langid==1.1.6
396
+ lazy_loader==0.3
397
+ learntools==0.3.4
398
+ leven==1.0.4
399
+ libclang==16.0.6
400
+ libmambapy==1.5.0
401
+ libpysal==4.9.2
402
+ librosa==0.10.1
403
+ lightgbm==4.2.0
404
+ lightning-utilities==0.11.2
405
+ lime==0.2.0.1
406
+ line-profiler==4.1.2
407
+ linkify-it-py==2.0.3
408
+ llvmlite==0.41.1
409
+ llvmlite==0.42.0
410
+ lml==0.1.0
411
+ locket==1.0.0
412
+ loguru==0.7.2
413
+ lxml==5.2.1
414
+ lz4==4.3.3
415
+ mamba==1.5.0
416
+ mapclassify==2.6.1
417
+ markdown-it-py==3.0.0
418
+ marshmallow==3.21.1
419
+ matplotlib-inline==0.1.6
420
+ matplotlib-venn==0.11.10
421
+ matplotlib==3.7.5
422
+ matplotlib==3.8.3
423
+ mccabe==0.7.0
424
+ mdit-py-plugins==0.4.0
425
+ mdurl==0.1.2
426
+ memory-profiler==0.61.0
427
+ menuinst==2.0.1
428
+ mercantile==1.2.1
429
+ mgwr==2.2.1
430
+ missingno==0.5.2
431
+ mistune==0.8.4
432
+ mizani==0.11.1
433
+ ml-dtypes==0.2.0
434
+ mlcrate==0.2.0
435
+ mlens==0.2.3
436
+ mlxtend==0.23.1
437
+ mne==1.6.1
438
+ mnist==0.2.2
439
+ momepy==0.7.0
440
+ more-itertools==10.2.0
441
+ mpld3==0.5.10
442
+ mpmath==1.3.0
443
+ msgpack==1.0.7
444
+ multidict==6.0.4
445
+ multimethod==1.10
446
+ multipledispatch==1.0.0
447
+ multiprocess==0.70.15
448
+ munkres==1.1.4
449
+ murmurhash==1.0.10
450
+ mypy-extensions==1.0.0
451
+ namex==0.0.7
452
+ nb-conda-kernels==2.3.1
453
+ nb_conda==2.2.1
454
+ nbclassic==1.0.0
455
+ nbclient==0.5.13
456
+ nbconvert==6.4.5
457
+ nbdime==3.2.0
458
+ nbformat==5.9.2
459
+ ndindex==1.8
460
+ nest-asyncio==1.5.8
461
+ networkx==3.2.1
462
+ nibabel==5.2.1
463
+ nilearn==0.10.3
464
+ ninja==1.11.1.1
465
+ nltk==3.2.4
466
+ nose==1.3.7
467
+ notebook==6.5.4
468
+ notebook==6.5.6
469
+ notebook_executor==0.2
470
+ notebook_shim==0.2.3
471
+ numba==0.58.1
472
+ numba==0.59.1
473
+ numexpr==2.10.0
474
+ numpy==1.26.4
475
+ nvidia-ml-py==11.495.46
476
+ nvtx==0.2.10
477
+ oauth2client==4.1.3
478
+ oauthlib==3.2.2
479
+ objsize==0.6.1
480
+ odfpy==1.4.1
481
+ olefile==0.47
482
+ onnx==1.16.0
483
+ opencensus-context==0.1.3
484
+ opencensus==0.11.4
485
+ opencv-contrib-python==4.9.0.80
486
+ opencv-python-headless==4.9.0.80
487
+ opencv-python==4.9.0.80
488
+ openpyxl==3.1.2
489
+ openslide-python==1.3.1
490
+ opentelemetry-api==1.22.0
491
+ opentelemetry-exporter-otlp-proto-common==1.22.0
492
+ opentelemetry-exporter-otlp-proto-grpc==1.22.0
493
+ opentelemetry-exporter-otlp-proto-http==1.22.0
494
+ opentelemetry-exporter-otlp==1.22.0
495
+ opentelemetry-proto==1.22.0
496
+ opentelemetry-sdk==1.22.0
497
+ opentelemetry-semantic-conventions==0.43b0
498
+ opt-einsum==3.3.0
499
+ optax==0.2.2
500
+ optree==0.11.0
501
+ optuna==3.6.1
502
+ orbax-checkpoint==0.5.7
503
+ ordered-set==4.1.0
504
+ orjson==3.9.10
505
+ ortools==9.4.1874
506
+ osmnx==1.9.2
507
+ overrides==7.4.0
508
+ packaging==21.3
509
+ pandas-datareader==0.10.0
510
+ pandas-profiling==3.6.6
511
+ pandas-summary==0.2.0
512
+ pandas==2.1.4
513
+ pandas==2.2.1
514
+ pandasql==0.7.3
515
+ pandocfilters==1.5.0
516
+ panel==1.3.8
517
+ papermill==2.5.0
518
+ param==2.1.0
519
+ parso==0.8.3
520
+ partd==1.4.1
521
+ path.py==12.5.0
522
+ path==16.10.0
523
+ pathos==0.3.2
524
+ pathy==0.10.3
525
+ patsy==0.5.6
526
+ pdf2image==1.17.0
527
+ peft==0.10.0
528
+ pettingzoo==1.24.0
529
+ pexpect==4.8.0
530
+ pexpect==4.9.0
531
+ phik==0.12.4
532
+ pickleshare==0.7.5
533
+ pillow==10.3.0
534
+ pip==23.3.2
535
+ pkgutil_resolve_name==1.3.10
536
+ platformdirs==4.2.0
537
+ plotly-express==0.4.1
538
+ plotly==5.18.0
539
+ plotnine==0.13.4
540
+ pluggy==1.4.0
541
+ pointpats==2.4.0
542
+ polars==0.20.18
543
+ polyglot==16.7.4
544
+ pooch==1.8.1
545
+ pox==0.3.4
546
+ ppca==0.0.4
547
+ ppft==1.7.6.8
548
+ preprocessing==0.1.13
549
+ preshed==3.0.9
550
+ prettytable==3.9.0
551
+ progressbar2==4.4.2
552
+ prometheus-client==0.19.0
553
+ promise==2.3
554
+ prompt-toolkit==3.0.42
555
+ prompt-toolkit==3.0.43
556
+ prophet==1.1.1
557
+ proto-plus==1.23.0
558
+ protobuf==3.20.3
559
+ protobuf==4.21.12
560
+ psutil==5.9.3
561
+ psutil==5.9.7
562
+ ptyprocess==0.7.0
563
+ pudb==2024.1
564
+ pure-eval==0.2.2
565
+ py-cpuinfo==9.0.0
566
+ py-spy==0.3.14
567
+ py4j==0.10.9.7
568
+ pyLDAvis==3.4.1
569
+ pyOpenSSL==23.3.0
570
+ pyaml==23.12.0
571
+ pyarrow-hotfix==0.6
572
+ pyarrow==15.0.2
573
+ pyasn1-modules==0.3.0
574
+ pyasn1==0.5.1
575
+ pybind11==2.12.0
576
+ pyclipper==1.3.0.post5
577
+ pycodestyle==2.11.1
578
+ pycosat==0.6.6
579
+ pycparser==2.21
580
+ pycryptodome==3.20.0
581
+ pyct==0.5.0
582
+ pycuda==2024.1
583
+ pydantic==2.5.3
584
+ pydantic==2.6.4
585
+ pydantic_core==2.14.6
586
+ pydantic_core==2.16.3
587
+ pydegensac==0.1.2
588
+ pydicom==2.4.4
589
+ pydocstyle==6.3.0
590
+ pydot==1.4.2
591
+ pydub==0.25.1
592
+ pyemd==1.0.0
593
+ pyerfa==2.0.1.1
594
+ pyexcel-io==0.6.6
595
+ pyexcel-ods==0.6.0
596
+ pyflakes==3.2.0
597
+ pygltflib==1.16.2
598
+ pykalman==0.9.7
599
+ pylibraft==23.8.0
600
+ pylint==3.1.0
601
+ pymc3==3.11.4
602
+ pymongo==3.13.0
603
+ pynndescent==0.5.12
604
+ pynvml==11.4.1
605
+ pynvrtc==9.2
606
+ pyparsing==3.1.1
607
+ pyparsing==3.1.2
608
+ pypdf==4.1.0
609
+ pyproj==3.6.1
610
+ pysal==24.1
611
+ pyshp==2.3.1
612
+ pytesseract==0.3.10
613
+ pytest==8.1.1
614
+ python-bidi==0.4.2
615
+ python-dateutil==2.9.0.post0
616
+ python-dotenv==1.0.0
617
+ python-json-logger==2.0.7
618
+ python-louvain==0.16
619
+ python-lsp-jsonrpc==1.1.2
620
+ python-lsp-server==1.11.0
621
+ python-slugify==8.0.4
622
+ python-utils==3.8.2
623
+ pythreejs==2.4.2
624
+ pytoolconfig==1.3.1
625
+ pytools==2024.1.1
626
+ pytorch-ignite==0.5.0.post2
627
+ pytorch-lightning==2.2.1
628
+ pytz==2023.3.post1
629
+ pytz==2024.1
630
+ pyu2f==0.1.5
631
+ pyviz_comms==3.0.2
632
+ pyzmq==24.0.1
633
+ pyzmq==25.1.2
634
+ qgrid==1.3.1
635
+ qtconsole==5.5.1
636
+ quantecon==0.7.2
637
+ qudida==0.0.4
638
+ raft-dask==23.8.0
639
+ rasterio==1.3.9
640
+ rasterstats==0.19.0
641
+ ray-cpp==2.9.0
642
+ ray==2.9.0
643
+ referencing==0.32.1
644
+ regex==2023.12.25
645
+ requests-oauthlib==1.3.1
646
+ requests-toolbelt==0.10.1
647
+ requests==2.31.0
648
+ retrying==1.3.3
649
+ retrying==1.3.4
650
+ rfc3339-validator==0.1.4
651
+ rfc3986-validator==0.1.1
652
+ rgf-python==3.12.0
653
+ rich-click==1.7.4
654
+ rich==13.7.0
655
+ rich==13.7.1
656
+ rmm==23.8.0
657
+ rope==1.13.0
658
+ rpds-py==0.16.2
659
+ rsa==4.9
660
+ ruamel-yaml-conda==0.15.100
661
+ ruamel.yaml.clib==0.2.7
662
+ ruamel.yaml==0.17.40
663
+ s2sphere==0.2.5
664
+ s3fs==2024.2.0
665
+ s3transfer==0.6.2
666
+ safetensors==0.4.2
667
+ scattertext==0.1.19
668
+ scikit-image==0.22.0
669
+ scikit-learn-intelex==2024.2.0
670
+ scikit-learn==1.2.2
671
+ scikit-multilearn==0.2.0
672
+ scikit-optimize==0.10.1
673
+ scikit-plot==0.3.7
674
+ scikit-surprise==1.1.3
675
+ scipy==1.11.4
676
+ scipy==1.12.0
677
+ seaborn==0.12.2
678
+ segment_anything==1.0
679
+ segregation==2.5
680
+ semver==3.0.2
681
+ sentencepiece==0.2.0
682
+ sentry-sdk==1.44.1
683
+ setproctitle==1.3.3
684
+ setuptools-git==1.2
685
+ setuptools-scm==8.0.4
686
+ setuptools==69.0.3
687
+ shap==0.44.1
688
+ shapely==2.0.3
689
+ shellingham==1.5.4
690
+ shtab==1.7.1
691
+ simpervisor==1.0.0
692
+ simplejson==3.19.2
693
+ six==1.16.0
694
+ sklearn-pandas==2.2.0
695
+ slicer==0.0.7
696
+ smart-open==6.4.0
697
+ smmap==5.0.1
698
+ sniffio==1.3.0
699
+ snowballstemmer==2.2.0
700
+ snuggs==1.4.7
701
+ sortedcontainers==2.4.0
702
+ soundfile==0.12.1
703
+ soupsieve==2.5
704
+ soxr==0.3.7
705
+ spacy-legacy==3.0.12
706
+ spacy-loggers==1.0.5
707
+ spacy==3.7.2
708
+ spaghetti==1.7.5.post1
709
+ spectral==0.23.1
710
+ spglm==1.1.0
711
+ sphinx-rtd-theme==0.2.4
712
+ spint==1.0.7
713
+ splot==1.1.5.post1
714
+ spopt==0.6.0
715
+ spreg==1.4.2
716
+ spvcm==0.3.0
717
+ sqlparse==0.4.4
718
+ squarify==0.4.3
719
+ srsly==2.4.8
720
+ stable-baselines3==2.1.0
721
+ stack-data==0.6.2
722
+ stack-data==0.6.3
723
+ stanio==0.5.0
724
+ starlette==0.32.0.post1
725
+ statsmodels==0.14.1
726
+ stemming==1.0.1
727
+ stop-words==2018.7.23
728
+ stopit==1.1.2
729
+ stumpy==1.12.0
730
+ sympy==1.12
731
+ tables==3.9.2
732
+ tabulate==0.9.0
733
+ tangled-up-in-unicode==0.2.0
734
+ tbb==2021.12.0
735
+ tblib==3.0.0
736
+ tenacity==8.2.3
737
+ tensorboard-data-server==0.7.2
738
+ tensorboard-plugin-profile==2.15.0
739
+ tensorboard==2.15.1
740
+ tensorboardX==2.6.2.2
741
+ tensorflow-cloud==0.1.16
742
+ tensorflow-datasets==4.9.4
743
+ tensorflow-decision-forests==1.8.1
744
+ tensorflow-estimator==2.15.0
745
+ tensorflow-hub==0.16.1
746
+ tensorflow-io-gcs-filesystem==0.35.0
747
+ tensorflow-io==0.35.0
748
+ tensorflow-metadata==0.14.0
749
+ tensorflow-probability==0.23.0
750
+ tensorflow-serving-api==2.14.1
751
+ tensorflow-text==2.15.0
752
+ tensorflow-transform==0.14.0
753
+ tensorflow==2.15.0
754
+ tensorstore==0.1.56
755
+ termcolor==2.4.0
756
+ terminado==0.18.0
757
+ testpath==0.6.0
758
+ text-unidecode==1.3
759
+ textblob==0.18.0.post0
760
+ texttable==1.7.0
761
+ tf_keras==2.15.1
762
+ tfp-nightly==0.24.0.dev0
763
+ thinc==8.2.2
764
+ threadpoolctl==3.2.0
765
+ tifffile==2023.12.9
766
+ timm==0.9.16
767
+ tinycss2==1.2.1
768
+ tobler==0.11.2
769
+ tokenizers==0.15.2
770
+ toml==0.10.2
771
+ tomli==2.0.1
772
+ tomlkit==0.12.4
773
+ toolz==0.12.1
774
+ torch==2.1.2
775
+ torchaudio==2.1.2
776
+ torchdata==0.7.1
777
+ torchinfo==1.8.0
778
+ torchmetrics==1.3.2
779
+ torchtext==0.16.2
780
+ torchvision==0.16.2
781
+ tornado==6.3.3
782
+ tqdm==4.66.1
783
+ traceml==1.0.8
784
+ traitlets==5.9.0
785
+ traittypes==0.2.1
786
+ transformers==4.39.3
787
+ treelite-runtime==3.2.0
788
+ treelite==3.2.0
789
+ trl==0.8.1
790
+ truststore==0.8.0
791
+ trx-python==0.2.9
792
+ tsfresh==0.20.2
793
+ typeguard==4.1.5
794
+ typer==0.9.0
795
+ typer==0.9.4
796
+ types-python-dateutil==2.8.19.20240106
797
+ typing-inspect==0.9.0
798
+ typing-utils==0.1.0
799
+ typing_extensions==4.9.0
800
+ tyro==0.8.3
801
+ tzdata==2023.4
802
+ uc-micro-py==1.0.3
803
+ ucx-py==0.33.0
804
+ ujson==5.9.0
805
+ umap-learn==0.5.5
806
+ unicodedata2==15.1.0
807
+ update-checker==0.18.0
808
+ uri-template==1.3.0
809
+ uritemplate==3.0.1
810
+ urllib3==1.26.18
811
+ urllib3==2.1.0
812
+ urwid==2.6.10
813
+ urwid_readline==0.14
814
+ uvicorn==0.25.0
815
+ uvloop==0.19.0
816
+ vaex-astro==0.9.3
817
+ vaex-core==4.17.1
818
+ vaex-hdf5==0.14.1
819
+ vaex-jupyter==0.8.2
820
+ vaex-ml==0.18.3
821
+ vaex-server==0.9.0
822
+ vaex-viz==0.5.4
823
+ vaex==4.17.0
824
+ vec_noise==1.1.4
825
+ vecstack==0.4.0
826
+ virtualenv==20.21.0
827
+ visions==0.7.5
828
+ vowpalwabbit==9.9.0
829
+ vtk==9.3.0
830
+ wandb==0.16.5
831
+ wasabi==1.1.2
832
+ watchfiles==0.21.0
833
+ wavio==0.0.8
834
+ wcwidth==0.2.13
835
+ weasel==0.3.4
836
+ webcolors==1.13
837
+ webencodings==0.5.1
838
+ websocket-client==1.7.0
839
+ websockets==12.0
840
+ wfdb==4.1.2
841
+ whatthepatch==1.0.5
842
+ wheel==0.42.0
843
+ widgetsnbextension==3.6.6
844
+ witwidget==1.8.1
845
+ woodwork==0.29.0
846
+ wordcloud==1.9.3
847
+ wordsegment==1.3.1
848
+ wrapt==1.14.1
849
+ xarray-einstats==0.7.0
850
+ xarray==2024.3.0
851
+ xgboost==2.0.3
852
+ xvfbwrapper==0.2.9
853
+ xxhash==3.4.1
854
+ xyzservices==2023.10.1
855
+ y-py==0.6.2
856
+ yapf==0.40.2
857
+ yarl==1.9.3
858
+ yarl==1.9.4
859
+ ydata-profiling==4.6.4
860
+ yellowbrick==1.5
861
+ ypy-websocket==0.8.4
862
+ zict==3.0.0
863
+ zipp==3.17.0
864
+ zstandard==0.22.0
wandb/run-20240411_040722-rimyh9a1/files/wandb-metadata.json ADDED
@@ -0,0 +1,66 @@
1
+ {
2
+ "os": "Linux-5.15.133+-x86_64-with-glibc2.31",
3
+ "python": "3.10.13",
4
+ "heartbeatAt": "2024-04-11T04:07:23.361534",
5
+ "startedAt": "2024-04-11T04:07:22.840819",
6
+ "docker": null,
7
+ "cuda": null,
8
+ "args": [],
9
+ "state": "running",
10
+ "program": "kaggle.ipynb",
11
+ "codePathLocal": null,
12
+ "root": "/kaggle/working",
13
+ "host": "321ddc84c049",
14
+ "username": "root",
15
+ "executable": "/opt/conda/bin/python3.10",
16
+ "cpu_count": 2,
17
+ "cpu_count_logical": 4,
18
+ "cpu_freq": {
19
+ "current": 2000.19,
20
+ "min": 0.0,
21
+ "max": 0.0
22
+ },
23
+ "cpu_freq_per_core": [
24
+ {
25
+ "current": 2000.19,
26
+ "min": 0.0,
27
+ "max": 0.0
28
+ },
29
+ {
30
+ "current": 2000.19,
31
+ "min": 0.0,
32
+ "max": 0.0
33
+ },
34
+ {
35
+ "current": 2000.19,
36
+ "min": 0.0,
37
+ "max": 0.0
38
+ },
39
+ {
40
+ "current": 2000.19,
41
+ "min": 0.0,
42
+ "max": 0.0
43
+ }
44
+ ],
45
+ "disk": {
46
+ "/": {
47
+ "total": 8062.387607574463,
48
+ "used": 5566.962131500244
49
+ }
50
+ },
51
+ "gpu": "Tesla T4",
52
+ "gpu_count": 2,
53
+ "gpu_devices": [
54
+ {
55
+ "name": "Tesla T4",
56
+ "memory_total": 16106127360
57
+ },
58
+ {
59
+ "name": "Tesla T4",
60
+ "memory_total": 16106127360
61
+ }
62
+ ],
63
+ "memory": {
64
+ "total": 31.357559204101562
65
+ }
66
+ }
wandb/run-20240411_040722-rimyh9a1/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
1
+ {"train/loss": 3.4153, "train/grad_norm": 0.0, "train/learning_rate": 0.0, "train/epoch": 0.09, "train/global_step": 20000, "_timestamp": 1712827654.7326186, "_runtime": 19211.883972644806, "_step": 1006, "train_runtime": 18957.1753, "train_samples_per_second": 2.11, "train_steps_per_second": 1.055, "total_flos": 1.0807103426248704e+16, "train_loss": 3.9423419631004335}
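
Note: the summary above is internally consistent: 1.055 train_steps_per_second × 18,957 s train_runtime ≈ 20,000 steps, matching the max_steps of 20000 logged for this run, and train_samples_per_second / train_steps_per_second ≈ 2 suggests the effective per-step batch settled at about 2 samples, presumably after auto_find_batch_size backed off from the configured 8. The final train/loss of 3.4153 compares with an average train_loss of 3.94 over the run.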
wandb/run-20240411_040722-rimyh9a1/logs/debug-internal.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20240411_040722-rimyh9a1/logs/debug.log ADDED
@@ -0,0 +1,31 @@
1
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Current SDK version is 0.16.5
2
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Configure stats pid to 1050
3
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Loading settings from /root/.config/wandb/settings
4
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Loading settings from /kaggle/working/wandb/settings
5
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Loading settings from environment variables: {}
6
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
7
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program': '<python with no main file>'}
8
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_setup.py:_flush():76] Applying login settings: {}
9
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_init.py:_log_setup():527] Logging user logs to /kaggle/working/wandb/run-20240411_040722-rimyh9a1/logs/debug.log
10
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_init.py:_log_setup():528] Logging internal logs to /kaggle/working/wandb/run-20240411_040722-rimyh9a1/logs/debug-internal.log
11
+ 2024-04-11 04:07:22,843 INFO MainThread:1050 [wandb_init.py:_jupyter_setup():473] configuring jupyter hooks <wandb.sdk.wandb_init._WandbInit object at 0x7d563f5f5120>
12
+ 2024-04-11 04:07:22,844 INFO MainThread:1050 [wandb_init.py:init():567] calling init triggers
13
+ 2024-04-11 04:07:22,844 INFO MainThread:1050 [wandb_init.py:init():574] wandb.init called with sweep_config: {}
14
+ config: {}
15
+ 2024-04-11 04:07:22,844 INFO MainThread:1050 [wandb_init.py:init():617] starting backend
16
+ 2024-04-11 04:07:22,844 INFO MainThread:1050 [wandb_init.py:init():621] setting up manager
17
+ 2024-04-11 04:07:22,847 INFO MainThread:1050 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
18
+ 2024-04-11 04:07:22,848 INFO MainThread:1050 [wandb_init.py:init():629] backend started and connected
19
+ 2024-04-11 04:07:22,865 INFO MainThread:1050 [wandb_run.py:_label_probe_notebook():1299] probe notebook
20
+ 2024-04-11 04:07:23,106 INFO MainThread:1050 [wandb_init.py:init():721] updated telemetry
21
+ 2024-04-11 04:07:23,108 INFO MainThread:1050 [wandb_init.py:init():754] communicating run to backend with 90.0 second timeout
22
+ 2024-04-11 04:07:23,235 INFO MainThread:1050 [wandb_run.py:_on_init():2344] communicating current version
23
+ 2024-04-11 04:07:23,323 INFO MainThread:1050 [wandb_run.py:_on_init():2353] got version response upgrade_message: "wandb version 0.16.6 is available! To upgrade, please run:\n $ pip install wandb --upgrade"
24
+
25
+ 2024-04-11 04:07:23,324 INFO MainThread:1050 [wandb_init.py:init():805] starting run threads in backend
26
+ 2024-04-11 04:07:39,317 INFO MainThread:1050 [wandb_run.py:_console_start():2323] atexit reg
27
+ 2024-04-11 04:07:39,317 INFO MainThread:1050 [wandb_run.py:_redirect():2178] redirect: wrap_raw
28
+ 2024-04-11 04:07:39,318 INFO MainThread:1050 [wandb_run.py:_redirect():2243] Wrapping output streams.
29
+ 2024-04-11 04:07:39,318 INFO MainThread:1050 [wandb_run.py:_redirect():2268] Redirects installed.
30
+ 2024-04-11 04:07:39,319 INFO MainThread:1050 [wandb_init.py:init():848] run started, returning control to user process
31
+ 2024-04-11 04:07:39,324 INFO MainThread:1050 [wandb_run.py:_config_callback():1347] config_cb None None {'vocab_size': 250880, 'hidden_size': 1024, 'n_layer': 24, 'n_head': 16, 'layer_norm_epsilon': 1e-05, 'initializer_range': 0.02, 'use_cache': False, 'pretraining_tp': 1, 'apply_residual_connection_post_layernorm': False, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'bos_token_id': 1, 'eos_token_id': 2, 'slow_but_exact': False, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': None, 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['BloomForCausalLM'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'pad_token_id': 3, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'bigscience/bloomz-560m', 'transformers_version': '4.39.3', 'attention_softmax_in_fp32': True, 'bias_dropout_fusion': True, 'unk_token_id': 0, 'masked_softmax_fusion': True, 'model_type': 'bloom', 'n_inner': None, 'offset_alibi': 100, 'seq_length': 2048, 'skip_bias_add': True, 'skip_bias_add_qkv': False, 'quantization_config': {'quant_method': 'QuantizationMethod.BITS_AND_BYTES', '_load_in_8bit': False, '_load_in_4bit': True, 'llm_int8_threshold': 6.0, 'llm_int8_skip_modules': None, 'llm_int8_enable_fp32_cpu_offload': False, 'llm_int8_has_fp16_weight': False, 'bnb_4bit_quant_type': 'nf4', 'bnb_4bit_use_double_quant': False, 'bnb_4bit_compute_dtype': 'float16', 'bnb_4bit_quant_storage': 'uint8', 'load_in_4bit': True, 'load_in_8bit': False}, 'output_dir': '/kaggle/working/', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': False, 'do_predict': False, 'evaluation_strategy': 'no', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'learning_rate': 3e-05, 'weight_decay': 0.001, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 0.3, 'num_train_epochs': 5, 'max_steps': 20000, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/kaggle/working/runs/Apr11_04-07-17_321ddc84c049', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 20, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 1, 
'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': None, 'dataloader_num_workers': 8, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': '/kaggle/working/', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'paged_adamw_32bit', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['tensorboard', 'wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': True, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': True, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None}