Training in progress, step 1250

Browse files

Files changed (14) hide show

README.md +8 -7
adapter_config.json +5 -2
adapter_model.safetensors +1 -1
logs/events.out.tfevents.1731266026.18bcb61f052b.236.0 +3 -0
logs/events.out.tfevents.1735923028.1356149f6382.358.0 +3 -0
logs/events.out.tfevents.1736189043.154f07f7b0d9.1770.0 +3 -0
logs/events.out.tfevents.1736193007.154f07f7b0d9.1770.1 +3 -0
logs/events.out.tfevents.1736193779.154f07f7b0d9.1770.2 +3 -0
logs/events.out.tfevents.1736207773.024f507f3b84.986.0 +3 -0
logs/events.out.tfevents.1736724540.3d43f6dc00ef.359.0 +3 -0
logs/events.out.tfevents.1736724591.3d43f6dc00ef.359.1 +3 -0
logs/events.out.tfevents.1736732509.3d43f6dc00ef.359.2 +3 -0
tokenizer_config.json +1 -0
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 base_model: stabilityai/stable-code-instruct-3b
 library_name: transformers
-model_name: StableCode-schemaLinking-min
 tags:
 - generated_from_trainer
 - trl
@@ -9,7 +9,7 @@ tags:
 licence: license
 ---
-# Model Card for StableCode-schemaLinking-min
 This model is a fine-tuned version of [stabilityai/stable-code-instruct-3b](https://huggingface.co/stabilityai/stable-code-instruct-3b).
 It has been trained using [TRL](https://github.com/huggingface/trl).
@@ -20,24 +20,25 @@ It has been trained using [TRL](https://github.com/huggingface/trl).
 from transformers import pipeline
 question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
-generator = pipeline("text-generation", model="lleticiasilvaa/StableCode-schemaLinking-min", device="cuda")
 output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
 print(output["generated_text"])
 ```
 ## Training procedure
 This model was trained with SFT.
 ### Framework versions
-- TRL: 0.12.1
-- Transformers: 4.46.2
 - Pytorch: 2.5.1+cu121
-- Datasets: 3.1.0
-- Tokenizers: 0.20.3
 ## Citations

 ---
 base_model: stabilityai/stable-code-instruct-3b
 library_name: transformers
+model_name: StableCode-text2SQL-alias-indentacao
 tags:
 - generated_from_trainer
 - trl
 licence: license
 ---
+# Model Card for StableCode-text2SQL-alias-indentacao
 This model is a fine-tuned version of [stabilityai/stable-code-instruct-3b](https://huggingface.co/stabilityai/stable-code-instruct-3b).
 It has been trained using [TRL](https://github.com/huggingface/trl).
 from transformers import pipeline
 question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
+generator = pipeline("text-generation", model="lleticiasilvaa/StableCode-text2SQL-alias-indentacao", device="cuda")
 output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
 print(output["generated_text"])
 ```
 ## Training procedure
 This model was trained with SFT.
 ### Framework versions
+- TRL: 0.13.0
+- Transformers: 4.47.1
 - Pytorch: 2.5.1+cu121
+- Datasets: 3.2.0
+- Tokenizers: 0.21.0
 ## Citations

adapter_config.json CHANGED Viewed

@@ -6,6 +6,8 @@
   },
   "base_model_name_or_path": "stabilityai/stable-code-instruct-3b",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
@@ -14,6 +16,7 @@
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 128,
   "lora_dropout": 0.1,
   "megatron_config": null,
   "megatron_core": "megatron.core",
@@ -23,11 +26,11 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "o_proj",
     "k_proj",
     "gate_proj",
-    "v_proj",
     "q_proj",
     "down_proj",
     "up_proj"
   ],

   },
   "base_model_name_or_path": "stabilityai/stable-code-instruct-3b",
   "bias": "none",
+  "eva_config": null,
+  "exclude_modules": null,
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 128,
+  "lora_bias": false,
   "lora_dropout": 0.1,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "k_proj",
     "gate_proj",
     "q_proj",
+    "v_proj",
+    "o_proj",
     "down_proj",
     "up_proj"
   ],

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:262350168617eaaa7a39d6bf9cc74846936b9d116e0a43d43efedab1699dc957
 size 400616360

 version https://git-lfs.github.com/spec/v1
+oid sha256:55af33676eaa5df01b237957e91e836041ede0704c4f6ee669ac492731ede268
 size 400616360

logs/events.out.tfevents.1731266026.18bcb61f052b.236.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:603b50c83afe5fd04cbf442087a8c12f730a6b0104e001c42e689db89f81fecb
+size 8268

logs/events.out.tfevents.1735923028.1356149f6382.358.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8f024c1e2d4631c2b2cba7a7cd69bf12510b023147029fc09c0bd2b4d298bd5c
+size 10670

logs/events.out.tfevents.1736189043.154f07f7b0d9.1770.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:411d2371102f8c8e78ffb5b7931c855affd4e6ceb77b4226bf5ed42c248f1da0
+size 10325

logs/events.out.tfevents.1736193007.154f07f7b0d9.1770.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2f9c14789027d905f61df5a045ef15dceff49a4a059ff1afaf2251bf2fb8dc73
+size 6341

logs/events.out.tfevents.1736193779.154f07f7b0d9.1770.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f233a180ed80891f5e42198db98895eb3acfe9e46116c8b28e4185acdac17bd1
+size 7913

logs/events.out.tfevents.1736207773.024f507f3b84.986.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f38703773c7053a3387dfa2f767819615c15bf73f128452b65e5389f4777e554
+size 6339

logs/events.out.tfevents.1736724540.3d43f6dc00ef.359.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5491f5eba601fb491bc3e33c18752cf86552cf9104b7f2df2fc80735c641ea26
+size 5985

logs/events.out.tfevents.1736724591.3d43f6dc00ef.359.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1a36c37d07ca62be47d61a7db21b05cd74b1c5c407fdb834d3e25c00bc401c4f
+size 8267

logs/events.out.tfevents.1736732509.3d43f6dc00ef.359.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a157169c228969c7d72156524b5b7972278e1d6002f0918f53e4e61d93f5ded0
+size 6459

tokenizer_config.json CHANGED Viewed

@@ -384,6 +384,7 @@
   "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = 'You are a helpful assistant.' %}{% endif %}{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in loop_messages %}{% if loop.index0 == 0 %}{{'<|im_start|>system\n' + system_message + '<|im_end|>\n'}}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
   "clean_up_tokenization_spaces": true,
   "eos_token": "<|endoftext|>",
   "map_device": "auto",
   "model_max_length": 4096,
   "pad_token": "<|endoftext|>",

   "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = 'You are a helpful assistant.' %}{% endif %}{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in loop_messages %}{% if loop.index0 == 0 %}{{'<|im_start|>system\n' + system_message + '<|im_end|>\n'}}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
   "clean_up_tokenization_spaces": true,
   "eos_token": "<|endoftext|>",
+  "extra_special_tokens": {},
   "map_device": "auto",
   "model_max_length": 4096,
   "pad_token": "<|endoftext|>",

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:845388a2b1a6c201d4c35146c609dfa59b0d3daa4b02627dccafbc1634c54a96
 size 5560

 version https://git-lfs.github.com/spec/v1
+oid sha256:f46f9705b5aa6860fbd1b30c0b0e53d4152cbbb594d2bede78bf3a0776b44780
 size 5560