lleticiasilvaa committed on
Commit
54cf148
·
verified ·
1 Parent(s): db1307d

Training in progress, step 1250

Browse files
README.md CHANGED
@@ -1,7 +1,7 @@
1
  ---
2
  base_model: stabilityai/stable-code-instruct-3b
3
  library_name: transformers
4
- model_name: StableCode-schemaLinking-min
5
  tags:
6
  - generated_from_trainer
7
  - trl
@@ -9,7 +9,7 @@ tags:
9
  licence: license
10
  ---
11
 
12
- # Model Card for StableCode-schemaLinking-min
13
 
14
  This model is a fine-tuned version of [stabilityai/stable-code-instruct-3b](https://huggingface.co/stabilityai/stable-code-instruct-3b).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
@@ -20,24 +20,25 @@ It has been trained using [TRL](https://github.com/huggingface/trl).
20
  from transformers import pipeline
21
 
22
  question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
23
- generator = pipeline("text-generation", model="lleticiasilvaa/StableCode-schemaLinking-min", device="cuda")
24
  output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
25
  print(output["generated_text"])
26
  ```
27
 
28
  ## Training procedure
29
 
 
30
 
31
 
32
  This model was trained with SFT.
33
 
34
  ### Framework versions
35
 
36
- - TRL: 0.12.1
37
- - Transformers: 4.46.2
38
  - Pytorch: 2.5.1+cu121
39
- - Datasets: 3.1.0
40
- - Tokenizers: 0.20.3
41
 
42
  ## Citations
43
 
 
1
  ---
2
  base_model: stabilityai/stable-code-instruct-3b
3
  library_name: transformers
4
+ model_name: StableCode-text2SQL-alias-indentacao
5
  tags:
6
  - generated_from_trainer
7
  - trl
 
9
  licence: license
10
  ---
11
 
12
+ # Model Card for StableCode-text2SQL-alias-indentacao
13
 
14
  This model is a fine-tuned version of [stabilityai/stable-code-instruct-3b](https://huggingface.co/stabilityai/stable-code-instruct-3b).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
 
20
  from transformers import pipeline
21
 
22
  question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
23
+ generator = pipeline("text-generation", model="lleticiasilvaa/StableCode-text2SQL-alias-indentacao", device="cuda")
24
  output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
25
  print(output["generated_text"])
26
  ```
27
 
28
  ## Training procedure
29
 
30
+
31
 
32
 
33
  This model was trained with SFT.
34
 
35
  ### Framework versions
36
 
37
+ - TRL: 0.13.0
38
+ - Transformers: 4.47.1
39
  - Pytorch: 2.5.1+cu121
40
+ - Datasets: 3.2.0
41
+ - Tokenizers: 0.21.0
42
 
43
  ## Citations
44
 
adapter_config.json CHANGED
@@ -6,6 +6,8 @@
6
  },
7
  "base_model_name_or_path": "stabilityai/stable-code-instruct-3b",
8
  "bias": "none",
 
 
9
  "fan_in_fan_out": false,
10
  "inference_mode": true,
11
  "init_lora_weights": true,
@@ -14,6 +16,7 @@
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
  "lora_alpha": 128,
 
17
  "lora_dropout": 0.1,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
@@ -23,11 +26,11 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "o_proj",
27
  "k_proj",
28
  "gate_proj",
29
- "v_proj",
30
  "q_proj",
 
 
31
  "down_proj",
32
  "up_proj"
33
  ],
 
6
  },
7
  "base_model_name_or_path": "stabilityai/stable-code-instruct-3b",
8
  "bias": "none",
9
+ "eva_config": null,
10
+ "exclude_modules": null,
11
  "fan_in_fan_out": false,
12
  "inference_mode": true,
13
  "init_lora_weights": true,
 
16
  "layers_to_transform": null,
17
  "loftq_config": {},
18
  "lora_alpha": 128,
19
+ "lora_bias": false,
20
  "lora_dropout": 0.1,
21
  "megatron_config": null,
22
  "megatron_core": "megatron.core",
 
26
  "rank_pattern": {},
27
  "revision": null,
28
  "target_modules": [
 
29
  "k_proj",
30
  "gate_proj",
 
31
  "q_proj",
32
+ "v_proj",
33
+ "o_proj",
34
  "down_proj",
35
  "up_proj"
36
  ],
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:262350168617eaaa7a39d6bf9cc74846936b9d116e0a43d43efedab1699dc957
3
  size 400616360
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55af33676eaa5df01b237957e91e836041ede0704c4f6ee669ac492731ede268
3
  size 400616360
logs/events.out.tfevents.1731266026.18bcb61f052b.236.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:603b50c83afe5fd04cbf442087a8c12f730a6b0104e001c42e689db89f81fecb
3
+ size 8268
logs/events.out.tfevents.1735923028.1356149f6382.358.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f024c1e2d4631c2b2cba7a7cd69bf12510b023147029fc09c0bd2b4d298bd5c
3
+ size 10670
logs/events.out.tfevents.1736189043.154f07f7b0d9.1770.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:411d2371102f8c8e78ffb5b7931c855affd4e6ceb77b4226bf5ed42c248f1da0
3
+ size 10325
logs/events.out.tfevents.1736193007.154f07f7b0d9.1770.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f9c14789027d905f61df5a045ef15dceff49a4a059ff1afaf2251bf2fb8dc73
3
+ size 6341
logs/events.out.tfevents.1736193779.154f07f7b0d9.1770.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f233a180ed80891f5e42198db98895eb3acfe9e46116c8b28e4185acdac17bd1
3
+ size 7913
logs/events.out.tfevents.1736207773.024f507f3b84.986.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f38703773c7053a3387dfa2f767819615c15bf73f128452b65e5389f4777e554
3
+ size 6339
logs/events.out.tfevents.1736724540.3d43f6dc00ef.359.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5491f5eba601fb491bc3e33c18752cf86552cf9104b7f2df2fc80735c641ea26
3
+ size 5985
logs/events.out.tfevents.1736724591.3d43f6dc00ef.359.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a36c37d07ca62be47d61a7db21b05cd74b1c5c407fdb834d3e25c00bc401c4f
3
+ size 8267
logs/events.out.tfevents.1736732509.3d43f6dc00ef.359.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a157169c228969c7d72156524b5b7972278e1d6002f0918f53e4e61d93f5ded0
3
+ size 6459
tokenizer_config.json CHANGED
@@ -384,6 +384,7 @@
384
  "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = 'You are a helpful assistant.' %}{% endif %}{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in loop_messages %}{% if loop.index0 == 0 %}{{'<|im_start|>system\n' + system_message + '<|im_end|>\n'}}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
385
  "clean_up_tokenization_spaces": true,
386
  "eos_token": "<|endoftext|>",
 
387
  "map_device": "auto",
388
  "model_max_length": 4096,
389
  "pad_token": "<|endoftext|>",
 
384
  "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = 'You are a helpful assistant.' %}{% endif %}{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in loop_messages %}{% if loop.index0 == 0 %}{{'<|im_start|>system\n' + system_message + '<|im_end|>\n'}}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
385
  "clean_up_tokenization_spaces": true,
386
  "eos_token": "<|endoftext|>",
387
+ "extra_special_tokens": {},
388
  "map_device": "auto",
389
  "model_max_length": 4096,
390
  "pad_token": "<|endoftext|>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:845388a2b1a6c201d4c35146c609dfa59b0d3daa4b02627dccafbc1634c54a96
3
  size 5560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f46f9705b5aa6860fbd1b30c0b0e53d4152cbbb594d2bede78bf3a0776b44780
3
  size 5560