Archit1243 committed on
Commit
2e944df
·
verified ·
1 Parent(s): b1ae9f1

/mistral-MCQ

Browse files
README.md CHANGED
@@ -44,14 +44,10 @@ The following hyperparameters were used during training:
44
  - lr_scheduler_warmup_ratio: 0.03
45
  - num_epochs: 1
46
 
47
- ### Training results
48
-
49
-
50
-
51
  ### Framework versions
52
 
53
  - PEFT 0.10.0
54
  - Transformers 4.39.3
55
- - Pytorch 2.2.1+cu121
56
  - Datasets 2.18.0
57
  - Tokenizers 0.15.2
 
44
  - lr_scheduler_warmup_ratio: 0.03
45
  - num_epochs: 1
46
 
 
 
 
 
47
  ### Framework versions
48
 
49
  - PEFT 0.10.0
50
  - Transformers 4.39.3
51
+ - Pytorch 2.1.2
52
  - Datasets 2.18.0
53
  - Tokenizers 0.15.2
adapter_config.json CHANGED
@@ -20,11 +20,11 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "gate_proj",
24
- "v_proj",
25
  "o_proj",
26
  "k_proj",
27
- "q_proj"
 
 
28
  ],
29
  "task_type": "CAUSAL_LM",
30
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
 
23
  "o_proj",
24
  "k_proj",
25
+ "gate_proj",
26
+ "q_proj",
27
+ "v_proj"
28
  ],
29
  "task_type": "CAUSAL_LM",
30
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ad6dc61cea4ea7ae2238a64b517642fe244e1ca2075248f6fad18a1c397f3de
3
  size 369142184
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5380716c2fe7bfff8528b061ce0167c0958bc28dee633cfa6375117df1a78c48
3
  size 369142184
runs/Apr09_15-43-08_a102a0159da3/events.out.tfevents.1712677424.a102a0159da3.34.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72608cceeb845f8293a3a39db499a4a75b9f438d6d3b2185fb52bdd2f26df7c3
3
+ size 5080
tokenizer.json CHANGED
@@ -62,12 +62,6 @@
62
  "id": "A",
63
  "type_id": 0
64
  }
65
- },
66
- {
67
- "SpecialToken": {
68
- "id": "</s>",
69
- "type_id": 0
70
- }
71
  }
72
  ],
73
  "pair": [
@@ -83,12 +77,6 @@
83
  "type_id": 0
84
  }
85
  },
86
- {
87
- "SpecialToken": {
88
- "id": "</s>",
89
- "type_id": 0
90
- }
91
- },
92
  {
93
  "SpecialToken": {
94
  "id": "<s>",
@@ -100,24 +88,9 @@
100
  "id": "B",
101
  "type_id": 1
102
  }
103
- },
104
- {
105
- "SpecialToken": {
106
- "id": "</s>",
107
- "type_id": 1
108
- }
109
  }
110
  ],
111
  "special_tokens": {
112
- "</s>": {
113
- "id": "</s>",
114
- "ids": [
115
- 2
116
- ],
117
- "tokens": [
118
- "</s>"
119
- ]
120
- },
121
  "<s>": {
122
  "id": "<s>",
123
  "ids": [
 
62
  "id": "A",
63
  "type_id": 0
64
  }
 
 
 
 
 
 
65
  }
66
  ],
67
  "pair": [
 
77
  "type_id": 0
78
  }
79
  },
 
 
 
 
 
 
80
  {
81
  "SpecialToken": {
82
  "id": "<s>",
 
88
  "id": "B",
89
  "type_id": 1
90
  }
 
 
 
 
 
 
91
  }
92
  ],
93
  "special_tokens": {
 
 
 
 
 
 
 
 
 
94
  "<s>": {
95
  "id": "<s>",
96
  "ids": [
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
3
+ size 493443
tokenizer_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "add_bos_token": true,
3
- "add_eos_token": true,
4
  "added_tokens_decoder": {
5
  "0": {
6
  "content": "<unk>",
 
1
  {
2
  "add_bos_token": true,
3
+ "add_eos_token": false,
4
  "added_tokens_decoder": {
5
  "0": {
6
  "content": "<unk>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc6752991eb064f5476769d7bdc3f881a5f6821059c2fbf90ac4c76ad27f8f94
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:654fc96c5593be9115eb856819ecd76b107cb665c1b86b1ffae8fa30d1f266b6
3
  size 4920