thanhdath committed on
Commit
0241d6b
·
1 Parent(s): 905d378

Update checkpoint from thanhdath/FINER-SQL-3B-BIRD + add GitHub link (#3)

Browse files

- Update checkpoint from thanhdath/FINER-SQL-3B-BIRD + add GitHub link (9684f35e81de47e77d90683bdee359237b4040a4)
- Replace README with minimal version (GitHub link + citation) (362452528c6fdae9c8a21c5de1041b71a38bad82)

README.md CHANGED
@@ -1,17 +1,13 @@
1
- ---
2
- base_model:
3
- - griffith-bigdata/Qwen-2.5-Coder-3B-SQL-Writer
4
- ---
5
-
6
- # FINER-SQL-3B-BIRD
7
-
8
- Trained from [`griffith-bigdata/Qwen-2.5-Coder-3B-SQL-Writer`](https://huggingface.co/griffith-bigdata/Qwen-2.5-Coder-3B-SQL-Writer) using GRPO with two dense rewards from the FINER-SQL paper:
9
-
10
- 🧠 Memory Reward — aligns reasoning with verified traces
11
- ⚙️ Atomic Reward — measures operation-level SQL overlap
12
-
13
- ✅ 67.5% EX on BIRD when training only on BIRD train dataset; infer on a single 12-24 GB GPU
14
-
15
- 📄 See other models: https://huggingface.co/collections/griffith-bigdata/finer-sql
16
-
17
- 📄 Github: https://github.com/thanhdath/finer-sql/tree/main
 
1
+ 📄 GitHub: https://github.com/thanhdath/finer-sql
2
+
3
+ ## Citation
4
+
5
+ ```bibtex
6
+ @inproceedings{finersql,
7
+ author = {Thanh Dat Hoang and Thanh Trung Huynh and Matthias Weidlich and Thanh Tam Nguyen and Tong Chen and Hongzhi Yin and Quoc Viet Hung Nguyen},
8
+ title = {Boosting Small Language Models for Text-to-SQL with Fine-Grained Execution Feedback and Cost-Efficient Rewards},
9
+ booktitle = {ICDE},
10
+ publisher = {IEEE},
11
+ year = {2026},
12
+ }
13
+ ```
 
 
 
 
config.json CHANGED
@@ -59,7 +59,7 @@
59
  "rope_theta": 1000000.0,
60
  "sliding_window": null,
61
  "tie_word_embeddings": true,
62
- "transformers_version": "4.57.0",
63
  "use_cache": false,
64
  "use_sliding_window": false,
65
  "vocab_size": 151936
 
59
  "rope_theta": 1000000.0,
60
  "sliding_window": null,
61
  "tie_word_embeddings": true,
62
+ "transformers_version": "4.57.3",
63
  "use_cache": false,
64
  "use_sliding_window": false,
65
  "vocab_size": 151936
generation_config.json CHANGED
@@ -9,5 +9,5 @@
9
  "temperature": 0.7,
10
  "top_k": 20,
11
  "top_p": 0.8,
12
- "transformers_version": "4.57.0"
13
  }
 
9
  "temperature": 0.7,
10
  "top_k": 20,
11
  "top_p": 0.8,
12
+ "transformers_version": "4.57.3"
13
  }
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9164dea2c8426fe370018e57fc618e8fec599ab28db5e887a6c94c0c72a25e3a
3
  size 4957560304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee02a3811c46f66e0b9fb703a474b9996ea71d30b822aa900ea3b46c0e609cf1
3
  size 4957560304
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:edf6bbb1ddf2cfcd40825761b6153571a0a0b704cbb6302ce2d29a1d9b9fcfec
3
  size 1214366696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb660d6e329abcb9105a8183eb58798c4937d2a33e2e1e2c8ee43fa622fe888e
3
  size 1214366696
tokenizer_config.json CHANGED
@@ -201,12 +201,14 @@
201
  "extra_special_tokens": {},
202
  "max_length": 6192,
203
  "model_max_length": 32768,
 
204
  "pad_token": "<|endoftext|>",
 
205
  "padding_side": "left",
206
  "split_special_tokens": false,
207
  "stride": 0,
208
  "tokenizer_class": "Qwen2Tokenizer",
209
- "truncation_side": "right",
210
  "truncation_strategy": "longest_first",
211
  "unk_token": null
212
  }
 
201
  "extra_special_tokens": {},
202
  "max_length": 6192,
203
  "model_max_length": 32768,
204
+ "pad_to_multiple_of": null,
205
  "pad_token": "<|endoftext|>",
206
+ "pad_token_type_id": 0,
207
  "padding_side": "left",
208
  "split_special_tokens": false,
209
  "stride": 0,
210
  "tokenizer_class": "Qwen2Tokenizer",
211
+ "truncation_side": "left",
212
  "truncation_strategy": "longest_first",
213
  "unk_token": null
214
  }