bobber committed on
Commit
54f3199
·
1 Parent(s): 5243ca7

add checkpoints

Browse files
Files changed (28) hide show
  1. Qwen-0.5B-GRPO/checkpoint-1300/added_tokens.json +3 -0
  2. Qwen-0.5B-GRPO/checkpoint-1300/config.json +3 -0
  3. Qwen-0.5B-GRPO/checkpoint-1300/generation_config.json +3 -0
  4. Qwen-0.5B-GRPO/checkpoint-1300/merges.txt +3 -0
  5. Qwen-0.5B-GRPO/checkpoint-1300/model.safetensors +3 -0
  6. Qwen-0.5B-GRPO/checkpoint-1300/optimizer.pt +3 -0
  7. Qwen-0.5B-GRPO/checkpoint-1300/rng_state.pth +3 -0
  8. Qwen-0.5B-GRPO/checkpoint-1300/scheduler.pt +3 -0
  9. Qwen-0.5B-GRPO/checkpoint-1300/special_tokens_map.json +3 -0
  10. Qwen-0.5B-GRPO/checkpoint-1300/tokenizer.json +3 -0
  11. Qwen-0.5B-GRPO/checkpoint-1300/tokenizer_config.json +3 -0
  12. Qwen-0.5B-GRPO/checkpoint-1300/trainer_state.json +3 -0
  13. Qwen-0.5B-GRPO/checkpoint-1300/training_args.bin +3 -0
  14. Qwen-0.5B-GRPO/checkpoint-1300/vocab.json +3 -0
  15. Qwen-0.5B-GRPO/checkpoint-1400/added_tokens.json +3 -0
  16. Qwen-0.5B-GRPO/checkpoint-1400/config.json +3 -0
  17. Qwen-0.5B-GRPO/checkpoint-1400/generation_config.json +3 -0
  18. Qwen-0.5B-GRPO/checkpoint-1400/merges.txt +3 -0
  19. Qwen-0.5B-GRPO/checkpoint-1400/model.safetensors +3 -0
  20. Qwen-0.5B-GRPO/checkpoint-1400/optimizer.pt +3 -0
  21. Qwen-0.5B-GRPO/checkpoint-1400/rng_state.pth +3 -0
  22. Qwen-0.5B-GRPO/checkpoint-1400/scheduler.pt +3 -0
  23. Qwen-0.5B-GRPO/checkpoint-1400/special_tokens_map.json +3 -0
  24. Qwen-0.5B-GRPO/checkpoint-1400/tokenizer.json +3 -0
  25. Qwen-0.5B-GRPO/checkpoint-1400/tokenizer_config.json +3 -0
  26. Qwen-0.5B-GRPO/checkpoint-1400/trainer_state.json +3 -0
  27. Qwen-0.5B-GRPO/checkpoint-1400/training_args.bin +3 -0
  28. Qwen-0.5B-GRPO/checkpoint-1400/vocab.json +3 -0
Qwen-0.5B-GRPO/checkpoint-1300/added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b
3
+ size 605
Qwen-0.5B-GRPO/checkpoint-1300/config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1853ace95e8460eebf92f339220785c6a904120a5b5655508ee6a66ff8012428
3
+ size 731
Qwen-0.5B-GRPO/checkpoint-1300/generation_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15794d5a480c43c46a7b861e4a564af5c4e8653b47569dea1afcc0fcf83f43d2
3
+ size 242
Qwen-0.5B-GRPO/checkpoint-1300/merges.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5
3
+ size 1671853
Qwen-0.5B-GRPO/checkpoint-1300/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7a94f35969998412a1fd04b1aa0247b4e9f872addcc4b890f8f315fdc5fa489
3
+ size 988097824
Qwen-0.5B-GRPO/checkpoint-1300/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72558107e92911c92a687694ecce7a3bb73437c2266e6e00a6e99de10f250421
3
+ size 1976374202
Qwen-0.5B-GRPO/checkpoint-1300/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38d771eae0eea8ca40011924e6d3bc921cf0b804d8f5d5a80c42b339992ff043
3
+ size 14180
Qwen-0.5B-GRPO/checkpoint-1300/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a034ae66f5fc47c3f8441afa22ada8b2ebf03f9bc9f67600966ddd1f8a2ff64
3
+ size 1064
Qwen-0.5B-GRPO/checkpoint-1300/special_tokens_map.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a36726f7fe394c1324021cac4a9ee3ad6c4f6285c0d98721f9b0b95888ec9905
3
+ size 496
Qwen-0.5B-GRPO/checkpoint-1300/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63a2951d5edfa5cc0a2346ef872f8c77a2920274cfc3b503b04e3799104dee80
3
+ size 11422060
Qwen-0.5B-GRPO/checkpoint-1300/tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f91b80bdb7722bdd0a25d79246fa79e513a7d4d78056b2eac8cbf92767937ab8
3
+ size 7333
Qwen-0.5B-GRPO/checkpoint-1300/trainer_state.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e654912d010e50e03588ad48a910ede887373dfdaa9a2acc0d646252d91c7706
3
+ size 733055
Qwen-0.5B-GRPO/checkpoint-1300/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03623afc2805403a4077a6c9dcc3f569621622405344041ab9b94e6a9d9c3c56
3
+ size 5560
Qwen-0.5B-GRPO/checkpoint-1300/vocab.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910
3
+ size 2776833
Qwen-0.5B-GRPO/checkpoint-1400/added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b
3
+ size 605
Qwen-0.5B-GRPO/checkpoint-1400/config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1853ace95e8460eebf92f339220785c6a904120a5b5655508ee6a66ff8012428
3
+ size 731
Qwen-0.5B-GRPO/checkpoint-1400/generation_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15794d5a480c43c46a7b861e4a564af5c4e8653b47569dea1afcc0fcf83f43d2
3
+ size 242
Qwen-0.5B-GRPO/checkpoint-1400/merges.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5
3
+ size 1671853
Qwen-0.5B-GRPO/checkpoint-1400/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c13f8b84cf516a614a4d3f15fd0eb7faaed805fd3192bc7858bba68dda70b76b
3
+ size 988097824
Qwen-0.5B-GRPO/checkpoint-1400/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6bc97d5f56783724faa0f5aec1fd167058c124638429c6d71b50ab929b9a570
3
+ size 1976374202
Qwen-0.5B-GRPO/checkpoint-1400/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8c41580160edc0701a0b7a870f6bb2f4ec5948a1fc9f6ca60f27e12fc91280b
3
+ size 14180
Qwen-0.5B-GRPO/checkpoint-1400/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98feb2ddbb5f2437cbcd9244ca9c06275520bb07751b2c1bcc3a8b1e096245ba
3
+ size 1064
Qwen-0.5B-GRPO/checkpoint-1400/special_tokens_map.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a36726f7fe394c1324021cac4a9ee3ad6c4f6285c0d98721f9b0b95888ec9905
3
+ size 496
Qwen-0.5B-GRPO/checkpoint-1400/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63a2951d5edfa5cc0a2346ef872f8c77a2920274cfc3b503b04e3799104dee80
3
+ size 11422060
Qwen-0.5B-GRPO/checkpoint-1400/tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f91b80bdb7722bdd0a25d79246fa79e513a7d4d78056b2eac8cbf92767937ab8
3
+ size 7333
Qwen-0.5B-GRPO/checkpoint-1400/trainer_state.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0eab666fdf64aadb58ce8f6f545dcd74e4ae26764cd57f40fdbf096ca21556d
3
+ size 789868
Qwen-0.5B-GRPO/checkpoint-1400/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03623afc2805403a4077a6c9dcc3f569621622405344041ab9b94e6a9d9c3c56
3
+ size 5560
Qwen-0.5B-GRPO/checkpoint-1400/vocab.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910
3
+ size 2776833