BenjaminB HF staff committed on
Commit
12390f5
1 Parent(s): aa08448

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. adalora_mlp/0.6.2/README.md +206 -0
  2. adalora_mlp/0.6.2/adapter_config.json +34 -0
  3. adalora_mlp/0.6.2/adapter_model.safetensors +3 -0
  4. adalora_mlp/0.6.2/output.pt +3 -0
  5. adalora_opt-350m/0.6.2/README.md +207 -0
  6. adalora_opt-350m/0.6.2/adapter_config.json +39 -0
  7. adalora_opt-350m/0.6.2/adapter_model.safetensors +3 -0
  8. adalora_opt-350m/0.6.2/output.pt +3 -0
  9. ia3_conv2d/0.6.2/README.md +206 -0
  10. ia3_conv2d/0.6.2/adapter_config.json +20 -0
  11. ia3_conv2d/0.6.2/adapter_model.safetensors +3 -0
  12. ia3_conv2d/0.6.2/output.pt +3 -0
  13. ia3_mlp/0.6.2/README.md +206 -0
  14. ia3_mlp/0.6.2/adapter_config.json +20 -0
  15. ia3_mlp/0.6.2/adapter_model.safetensors +3 -0
  16. ia3_mlp/0.6.2/output.pt +3 -0
  17. ia3_no_ff_mlp/0.6.2/README.md +206 -0
  18. ia3_no_ff_mlp/0.6.2/adapter_config.json +18 -0
  19. ia3_no_ff_mlp/0.6.2/adapter_model.safetensors +3 -0
  20. ia3_no_ff_mlp/0.6.2/output.pt +3 -0
  21. ia3_opt-350m/0.6.2/README.md +207 -0
  22. ia3_opt-350m/0.6.2/adapter_config.json +22 -0
  23. ia3_opt-350m/0.6.2/adapter_model.safetensors +3 -0
  24. ia3_opt-350m/0.6.2/output.pt +3 -0
  25. lora_conv2d/0.6.2/README.md +206 -0
  26. lora_conv2d/0.6.2/adapter_config.json +25 -0
  27. lora_conv2d/0.6.2/adapter_model.safetensors +3 -0
  28. lora_conv2d/0.6.2/output.pt +3 -0
  29. lora_emb_conv1d/0.6.2/README.md +206 -0
  30. lora_emb_conv1d/0.6.2/adapter_config.json +26 -0
  31. lora_emb_conv1d/0.6.2/adapter_model.safetensors +3 -0
  32. lora_emb_conv1d/0.6.2/output.pt +3 -0
  33. lora_mlp/0.6.2/README.md +206 -0
  34. lora_mlp/0.6.2/adapter_config.json +25 -0
  35. lora_mlp/0.6.2/adapter_model.safetensors +3 -0
  36. lora_mlp/0.6.2/output.pt +3 -0
  37. lora_mlp_modules_to_save/0.6.2/README.md +206 -0
  38. lora_mlp_modules_to_save/0.6.2/adapter_config.json +27 -0
  39. lora_mlp_modules_to_save/0.6.2/adapter_model.safetensors +3 -0
  40. lora_mlp_modules_to_save/0.6.2/output.pt +3 -0
  41. lora_opt-350m/0.6.2/README.md +207 -0
  42. lora_opt-350m/0.6.2/adapter_config.json +26 -0
  43. lora_opt-350m/0.6.2/adapter_model.safetensors +3 -0
  44. lora_opt-350m/0.6.2/output.pt +3 -0
  45. lora_opt-350m_bnb_4bit/0.6.2/README.md +219 -0
  46. lora_opt-350m_bnb_4bit/0.6.2/adapter_config.json +26 -0
  47. lora_opt-350m_bnb_4bit/0.6.2/adapter_model.safetensors +3 -0
  48. lora_opt-350m_bnb_4bit/0.6.2/output.pt +3 -0
  49. lora_opt-350m_bnb_8bit/0.6.2/README.md +219 -0
  50. lora_opt-350m_bnb_8bit/0.6.2/adapter_config.json +26 -0
adalora_mlp/0.6.2/README.md ADDED
@@ -0,0 +1,206 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ ---
4
+
5
+ # Model Card for Model ID
6
+
7
+ <!-- Provide a quick summary of what the model is/does. -->
8
+
9
+
10
+
11
+ ## Model Details
12
+
13
+ ### Model Description
14
+
15
+ <!-- Provide a longer summary of what this model is. -->
16
+
17
+
18
+
19
+ - **Developed by:** [More Information Needed]
20
+ - **Shared by [optional]:** [More Information Needed]
21
+ - **Model type:** [More Information Needed]
22
+ - **Language(s) (NLP):** [More Information Needed]
23
+ - **License:** [More Information Needed]
24
+ - **Finetuned from model [optional]:** [More Information Needed]
25
+
26
+ ### Model Sources [optional]
27
+
28
+ <!-- Provide the basic links for the model. -->
29
+
30
+ - **Repository:** [More Information Needed]
31
+ - **Paper [optional]:** [More Information Needed]
32
+ - **Demo [optional]:** [More Information Needed]
33
+
34
+ ## Uses
35
+
36
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
37
+
38
+ ### Direct Use
39
+
40
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
41
+
42
+ [More Information Needed]
43
+
44
+ ### Downstream Use [optional]
45
+
46
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
47
+
48
+ [More Information Needed]
49
+
50
+ ### Out-of-Scope Use
51
+
52
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
53
+
54
+ [More Information Needed]
55
+
56
+ ## Bias, Risks, and Limitations
57
+
58
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
59
+
60
+ [More Information Needed]
61
+
62
+ ### Recommendations
63
+
64
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
65
+
66
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
67
+
68
+ ## How to Get Started with the Model
69
+
70
+ Use the code below to get started with the model.
71
+
72
+ [More Information Needed]
73
+
74
+ ## Training Details
75
+
76
+ ### Training Data
77
+
78
+ <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
79
+
80
+ [More Information Needed]
81
+
82
+ ### Training Procedure
83
+
84
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
85
+
86
+ #### Preprocessing [optional]
87
+
88
+ [More Information Needed]
89
+
90
+
91
+ #### Training Hyperparameters
92
+
93
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
94
+
95
+ #### Speeds, Sizes, Times [optional]
96
+
97
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
98
+
99
+ [More Information Needed]
100
+
101
+ ## Evaluation
102
+
103
+ <!-- This section describes the evaluation protocols and provides the results. -->
104
+
105
+ ### Testing Data, Factors & Metrics
106
+
107
+ #### Testing Data
108
+
109
+ <!-- This should link to a Data Card if possible. -->
110
+
111
+ [More Information Needed]
112
+
113
+ #### Factors
114
+
115
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
116
+
117
+ [More Information Needed]
118
+
119
+ #### Metrics
120
+
121
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
122
+
123
+ [More Information Needed]
124
+
125
+ ### Results
126
+
127
+ [More Information Needed]
128
+
129
+ #### Summary
130
+
131
+
132
+
133
+ ## Model Examination [optional]
134
+
135
+ <!-- Relevant interpretability work for the model goes here -->
136
+
137
+ [More Information Needed]
138
+
139
+ ## Environmental Impact
140
+
141
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
142
+
143
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
144
+
145
+ - **Hardware Type:** [More Information Needed]
146
+ - **Hours used:** [More Information Needed]
147
+ - **Cloud Provider:** [More Information Needed]
148
+ - **Compute Region:** [More Information Needed]
149
+ - **Carbon Emitted:** [More Information Needed]
150
+
151
+ ## Technical Specifications [optional]
152
+
153
+ ### Model Architecture and Objective
154
+
155
+ [More Information Needed]
156
+
157
+ ### Compute Infrastructure
158
+
159
+ [More Information Needed]
160
+
161
+ #### Hardware
162
+
163
+ [More Information Needed]
164
+
165
+ #### Software
166
+
167
+ [More Information Needed]
168
+
169
+ ## Citation [optional]
170
+
171
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
172
+
173
+ **BibTeX:**
174
+
175
+ [More Information Needed]
176
+
177
+ **APA:**
178
+
179
+ [More Information Needed]
180
+
181
+ ## Glossary [optional]
182
+
183
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
184
+
185
+ [More Information Needed]
186
+
187
+ ## More Information [optional]
188
+
189
+ [More Information Needed]
190
+
191
+ ## Model Card Authors [optional]
192
+
193
+ [More Information Needed]
194
+
195
+ ## Model Card Contact
196
+
197
+ [More Information Needed]
198
+
199
+
200
+ ## Training procedure
201
+
202
+
203
+ ### Framework versions
204
+
205
+
206
+ - PEFT 0.6.2
adalora_mlp/0.6.2/adapter_config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "MLP",
5
+ "parent_library": "test_regression"
6
+ },
7
+ "base_model_name_or_path": null,
8
+ "beta1": 0.85,
9
+ "beta2": 0.85,
10
+ "bias": "none",
11
+ "deltaT": 1,
12
+ "fan_in_fan_out": false,
13
+ "inference_mode": true,
14
+ "init_lora_weights": false,
15
+ "init_r": 12,
16
+ "layers_pattern": null,
17
+ "layers_to_transform": null,
18
+ "lora_alpha": 8,
19
+ "lora_dropout": 0.0,
20
+ "modules_to_save": null,
21
+ "orth_reg_weight": 0.5,
22
+ "peft_type": "ADALORA",
23
+ "r": 8,
24
+ "rank_pattern": null,
25
+ "revision": null,
26
+ "target_modules": [
27
+ "lin0"
28
+ ],
29
+ "target_r": 8,
30
+ "task_type": null,
31
+ "tfinal": 0,
32
+ "tinit": 0,
33
+ "total_step": null
34
+ }
adalora_mlp/0.6.2/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9479f2503c55f4c63e0a5682c3855910de00377f39aee2ea9687412f45bb8d4
3
+ size 1792
adalora_mlp/0.6.2/output.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c90d9caa327c2bc1237d69be84caaa5ea3b9110f3b0ef3036e3349bf528c97ee
3
+ size 1239
adalora_opt-350m/0.6.2/README.md ADDED
@@ -0,0 +1,207 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ base_model: facebook/opt-350m
4
+ ---
5
+
6
+ # Model Card for Model ID
7
+
8
+ <!-- Provide a quick summary of what the model is/does. -->
9
+
10
+
11
+
12
+ ## Model Details
13
+
14
+ ### Model Description
15
+
16
+ <!-- Provide a longer summary of what this model is. -->
17
+
18
+
19
+
20
+ - **Developed by:** [More Information Needed]
21
+ - **Shared by [optional]:** [More Information Needed]
22
+ - **Model type:** [More Information Needed]
23
+ - **Language(s) (NLP):** [More Information Needed]
24
+ - **License:** [More Information Needed]
25
+ - **Finetuned from model [optional]:** [More Information Needed]
26
+
27
+ ### Model Sources [optional]
28
+
29
+ <!-- Provide the basic links for the model. -->
30
+
31
+ - **Repository:** [More Information Needed]
32
+ - **Paper [optional]:** [More Information Needed]
33
+ - **Demo [optional]:** [More Information Needed]
34
+
35
+ ## Uses
36
+
37
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
38
+
39
+ ### Direct Use
40
+
41
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
42
+
43
+ [More Information Needed]
44
+
45
+ ### Downstream Use [optional]
46
+
47
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
48
+
49
+ [More Information Needed]
50
+
51
+ ### Out-of-Scope Use
52
+
53
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
54
+
55
+ [More Information Needed]
56
+
57
+ ## Bias, Risks, and Limitations
58
+
59
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
60
+
61
+ [More Information Needed]
62
+
63
+ ### Recommendations
64
+
65
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
66
+
67
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
68
+
69
+ ## How to Get Started with the Model
70
+
71
+ Use the code below to get started with the model.
72
+
73
+ [More Information Needed]
74
+
75
+ ## Training Details
76
+
77
+ ### Training Data
78
+
79
+ <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
80
+
81
+ [More Information Needed]
82
+
83
+ ### Training Procedure
84
+
85
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
86
+
87
+ #### Preprocessing [optional]
88
+
89
+ [More Information Needed]
90
+
91
+
92
+ #### Training Hyperparameters
93
+
94
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
95
+
96
+ #### Speeds, Sizes, Times [optional]
97
+
98
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
99
+
100
+ [More Information Needed]
101
+
102
+ ## Evaluation
103
+
104
+ <!-- This section describes the evaluation protocols and provides the results. -->
105
+
106
+ ### Testing Data, Factors & Metrics
107
+
108
+ #### Testing Data
109
+
110
+ <!-- This should link to a Data Card if possible. -->
111
+
112
+ [More Information Needed]
113
+
114
+ #### Factors
115
+
116
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
117
+
118
+ [More Information Needed]
119
+
120
+ #### Metrics
121
+
122
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
123
+
124
+ [More Information Needed]
125
+
126
+ ### Results
127
+
128
+ [More Information Needed]
129
+
130
+ #### Summary
131
+
132
+
133
+
134
+ ## Model Examination [optional]
135
+
136
+ <!-- Relevant interpretability work for the model goes here -->
137
+
138
+ [More Information Needed]
139
+
140
+ ## Environmental Impact
141
+
142
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
143
+
144
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
145
+
146
+ - **Hardware Type:** [More Information Needed]
147
+ - **Hours used:** [More Information Needed]
148
+ - **Cloud Provider:** [More Information Needed]
149
+ - **Compute Region:** [More Information Needed]
150
+ - **Carbon Emitted:** [More Information Needed]
151
+
152
+ ## Technical Specifications [optional]
153
+
154
+ ### Model Architecture and Objective
155
+
156
+ [More Information Needed]
157
+
158
+ ### Compute Infrastructure
159
+
160
+ [More Information Needed]
161
+
162
+ #### Hardware
163
+
164
+ [More Information Needed]
165
+
166
+ #### Software
167
+
168
+ [More Information Needed]
169
+
170
+ ## Citation [optional]
171
+
172
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
173
+
174
+ **BibTeX:**
175
+
176
+ [More Information Needed]
177
+
178
+ **APA:**
179
+
180
+ [More Information Needed]
181
+
182
+ ## Glossary [optional]
183
+
184
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
185
+
186
+ [More Information Needed]
187
+
188
+ ## More Information [optional]
189
+
190
+ [More Information Needed]
191
+
192
+ ## Model Card Authors [optional]
193
+
194
+ [More Information Needed]
195
+
196
+ ## Model Card Contact
197
+
198
+ [More Information Needed]
199
+
200
+
201
+ ## Training procedure
202
+
203
+
204
+ ### Framework versions
205
+
206
+
207
+ - PEFT 0.6.2
adalora_opt-350m/0.6.2/adapter_config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "OPTForCausalLM",
5
+ "parent_library": "transformers.models.opt.modeling_opt"
6
+ },
7
+ "base_model_name_or_path": "facebook/opt-350m",
8
+ "beta1": 0.85,
9
+ "beta2": 0.85,
10
+ "bias": "none",
11
+ "deltaT": 1,
12
+ "fan_in_fan_out": false,
13
+ "inference_mode": true,
14
+ "init_lora_weights": false,
15
+ "init_r": 12,
16
+ "layers_pattern": null,
17
+ "layers_to_transform": null,
18
+ "lora_alpha": 8,
19
+ "lora_dropout": 0.0,
20
+ "modules_to_save": null,
21
+ "orth_reg_weight": 0.5,
22
+ "peft_type": "ADALORA",
23
+ "r": 8,
24
+ "rank_pattern": null,
25
+ "revision": null,
26
+ "target_modules": [
27
+ "q_proj",
28
+ "k_proj",
29
+ "v_proj",
30
+ "out_proj",
31
+ "fc1",
32
+ "fc2"
33
+ ],
34
+ "target_r": 8,
35
+ "task_type": null,
36
+ "tfinal": 0,
37
+ "tinit": 0,
38
+ "total_step": null
39
+ }
adalora_opt-350m/0.6.2/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b95942c9e2029d128034ec7ab28b882a763ccd18aa6dc0eb5c47dc66a89479ba
3
+ size 21296584
adalora_opt-350m/0.6.2/output.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45cd059248e254577130528f6b9b6ab434bda781523f9e33e6ba47c67b429ff8
3
+ size 1207639
ia3_conv2d/0.6.2/README.md ADDED
@@ -0,0 +1,206 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ ---
4
+
5
+ # Model Card for Model ID
6
+
7
+ <!-- Provide a quick summary of what the model is/does. -->
8
+
9
+
10
+
11
+ ## Model Details
12
+
13
+ ### Model Description
14
+
15
+ <!-- Provide a longer summary of what this model is. -->
16
+
17
+
18
+
19
+ - **Developed by:** [More Information Needed]
20
+ - **Shared by [optional]:** [More Information Needed]
21
+ - **Model type:** [More Information Needed]
22
+ - **Language(s) (NLP):** [More Information Needed]
23
+ - **License:** [More Information Needed]
24
+ - **Finetuned from model [optional]:** [More Information Needed]
25
+
26
+ ### Model Sources [optional]
27
+
28
+ <!-- Provide the basic links for the model. -->
29
+
30
+ - **Repository:** [More Information Needed]
31
+ - **Paper [optional]:** [More Information Needed]
32
+ - **Demo [optional]:** [More Information Needed]
33
+
34
+ ## Uses
35
+
36
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
37
+
38
+ ### Direct Use
39
+
40
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
41
+
42
+ [More Information Needed]
43
+
44
+ ### Downstream Use [optional]
45
+
46
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
47
+
48
+ [More Information Needed]
49
+
50
+ ### Out-of-Scope Use
51
+
52
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
53
+
54
+ [More Information Needed]
55
+
56
+ ## Bias, Risks, and Limitations
57
+
58
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
59
+
60
+ [More Information Needed]
61
+
62
+ ### Recommendations
63
+
64
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
65
+
66
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
67
+
68
+ ## How to Get Started with the Model
69
+
70
+ Use the code below to get started with the model.
71
+
72
+ [More Information Needed]
73
+
74
+ ## Training Details
75
+
76
+ ### Training Data
77
+
78
+ <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
79
+
80
+ [More Information Needed]
81
+
82
+ ### Training Procedure
83
+
84
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
85
+
86
+ #### Preprocessing [optional]
87
+
88
+ [More Information Needed]
89
+
90
+
91
+ #### Training Hyperparameters
92
+
93
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
94
+
95
+ #### Speeds, Sizes, Times [optional]
96
+
97
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
98
+
99
+ [More Information Needed]
100
+
101
+ ## Evaluation
102
+
103
+ <!-- This section describes the evaluation protocols and provides the results. -->
104
+
105
+ ### Testing Data, Factors & Metrics
106
+
107
+ #### Testing Data
108
+
109
+ <!-- This should link to a Data Card if possible. -->
110
+
111
+ [More Information Needed]
112
+
113
+ #### Factors
114
+
115
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
116
+
117
+ [More Information Needed]
118
+
119
+ #### Metrics
120
+
121
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
122
+
123
+ [More Information Needed]
124
+
125
+ ### Results
126
+
127
+ [More Information Needed]
128
+
129
+ #### Summary
130
+
131
+
132
+
133
+ ## Model Examination [optional]
134
+
135
+ <!-- Relevant interpretability work for the model goes here -->
136
+
137
+ [More Information Needed]
138
+
139
+ ## Environmental Impact
140
+
141
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
142
+
143
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
144
+
145
+ - **Hardware Type:** [More Information Needed]
146
+ - **Hours used:** [More Information Needed]
147
+ - **Cloud Provider:** [More Information Needed]
148
+ - **Compute Region:** [More Information Needed]
149
+ - **Carbon Emitted:** [More Information Needed]
150
+
151
+ ## Technical Specifications [optional]
152
+
153
+ ### Model Architecture and Objective
154
+
155
+ [More Information Needed]
156
+
157
+ ### Compute Infrastructure
158
+
159
+ [More Information Needed]
160
+
161
+ #### Hardware
162
+
163
+ [More Information Needed]
164
+
165
+ #### Software
166
+
167
+ [More Information Needed]
168
+
169
+ ## Citation [optional]
170
+
171
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
172
+
173
+ **BibTeX:**
174
+
175
+ [More Information Needed]
176
+
177
+ **APA:**
178
+
179
+ [More Information Needed]
180
+
181
+ ## Glossary [optional]
182
+
183
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
184
+
185
+ [More Information Needed]
186
+
187
+ ## More Information [optional]
188
+
189
+ [More Information Needed]
190
+
191
+ ## Model Card Authors [optional]
192
+
193
+ [More Information Needed]
194
+
195
+ ## Model Card Contact
196
+
197
+ [More Information Needed]
198
+
199
+
200
+ ## Training procedure
201
+
202
+
203
+ ### Framework versions
204
+
205
+
206
+ - PEFT 0.6.2
ia3_conv2d/0.6.2/adapter_config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "auto_mapping": {
3
+ "base_model_class": "ModelConv2D",
4
+ "parent_library": "test_regression"
5
+ },
6
+ "base_model_name_or_path": null,
7
+ "fan_in_fan_out": false,
8
+ "feedforward_modules": [
9
+ "conv2d"
10
+ ],
11
+ "inference_mode": true,
12
+ "init_ia3_weights": false,
13
+ "modules_to_save": null,
14
+ "peft_type": "IA3",
15
+ "revision": null,
16
+ "target_modules": [
17
+ "conv2d"
18
+ ],
19
+ "task_type": null
20
+ }
ia3_conv2d/0.6.2/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b3d25f99cd10353987666d320c8ae6f7a2e61129836888af543059a6d2233ed
3
+ size 148
ia3_conv2d/0.6.2/output.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6aeaa649528f43b5360de6d40aa805ac7bb1a9a98799172df77d04c21324a308
3
+ size 1175
ia3_mlp/0.6.2/README.md ADDED
@@ -0,0 +1,206 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ ---
4
+
5
+ # Model Card for Model ID
6
+
7
+ <!-- Provide a quick summary of what the model is/does. -->
8
+
9
+
10
+
11
+ ## Model Details
12
+
13
+ ### Model Description
14
+
15
+ <!-- Provide a longer summary of what this model is. -->
16
+
17
+
18
+
19
+ - **Developed by:** [More Information Needed]
20
+ - **Shared by [optional]:** [More Information Needed]
21
+ - **Model type:** [More Information Needed]
22
+ - **Language(s) (NLP):** [More Information Needed]
23
+ - **License:** [More Information Needed]
24
+ - **Finetuned from model [optional]:** [More Information Needed]
25
+
26
+ ### Model Sources [optional]
27
+
28
+ <!-- Provide the basic links for the model. -->
29
+
30
+ - **Repository:** [More Information Needed]
31
+ - **Paper [optional]:** [More Information Needed]
32
+ - **Demo [optional]:** [More Information Needed]
33
+
34
+ ## Uses
35
+
36
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
37
+
38
+ ### Direct Use
39
+
40
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
41
+
42
+ [More Information Needed]
43
+
44
+ ### Downstream Use [optional]
45
+
46
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
47
+
48
+ [More Information Needed]
49
+
50
+ ### Out-of-Scope Use
51
+
52
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
53
+
54
+ [More Information Needed]
55
+
56
+ ## Bias, Risks, and Limitations
57
+
58
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
59
+
60
+ [More Information Needed]
61
+
62
+ ### Recommendations
63
+
64
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
65
+
66
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
67
+
68
+ ## How to Get Started with the Model
69
+
70
+ Use the code below to get started with the model.
71
+
72
+ [More Information Needed]
73
+
74
+ ## Training Details
75
+
76
+ ### Training Data
77
+
78
+ <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
79
+
80
+ [More Information Needed]
81
+
82
+ ### Training Procedure
83
+
84
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
85
+
86
+ #### Preprocessing [optional]
87
+
88
+ [More Information Needed]
89
+
90
+
91
+ #### Training Hyperparameters
92
+
93
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
94
+
95
+ #### Speeds, Sizes, Times [optional]
96
+
97
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
98
+
99
+ [More Information Needed]
100
+
101
+ ## Evaluation
102
+
103
+ <!-- This section describes the evaluation protocols and provides the results. -->
104
+
105
+ ### Testing Data, Factors & Metrics
106
+
107
+ #### Testing Data
108
+
109
+ <!-- This should link to a Data Card if possible. -->
110
+
111
+ [More Information Needed]
112
+
113
+ #### Factors
114
+
115
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
116
+
117
+ [More Information Needed]
118
+
119
+ #### Metrics
120
+
121
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
122
+
123
+ [More Information Needed]
124
+
125
+ ### Results
126
+
127
+ [More Information Needed]
128
+
129
+ #### Summary
130
+
131
+
132
+
133
+ ## Model Examination [optional]
134
+
135
+ <!-- Relevant interpretability work for the model goes here -->
136
+
137
+ [More Information Needed]
138
+
139
+ ## Environmental Impact
140
+
141
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
142
+
143
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
144
+
145
+ - **Hardware Type:** [More Information Needed]
146
+ - **Hours used:** [More Information Needed]
147
+ - **Cloud Provider:** [More Information Needed]
148
+ - **Compute Region:** [More Information Needed]
149
+ - **Carbon Emitted:** [More Information Needed]
150
+
151
+ ## Technical Specifications [optional]
152
+
153
+ ### Model Architecture and Objective
154
+
155
+ [More Information Needed]
156
+
157
+ ### Compute Infrastructure
158
+
159
+ [More Information Needed]
160
+
161
+ #### Hardware
162
+
163
+ [More Information Needed]
164
+
165
+ #### Software
166
+
167
+ [More Information Needed]
168
+
169
+ ## Citation [optional]
170
+
171
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
172
+
173
+ **BibTeX:**
174
+
175
+ [More Information Needed]
176
+
177
+ **APA:**
178
+
179
+ [More Information Needed]
180
+
181
+ ## Glossary [optional]
182
+
183
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
184
+
185
+ [More Information Needed]
186
+
187
+ ## More Information [optional]
188
+
189
+ [More Information Needed]
190
+
191
+ ## Model Card Authors [optional]
192
+
193
+ [More Information Needed]
194
+
195
+ ## Model Card Contact
196
+
197
+ [More Information Needed]
198
+
199
+
200
+ ## Training procedure
201
+
202
+
203
+ ### Framework versions
204
+
205
+
206
+ - PEFT 0.6.2
ia3_mlp/0.6.2/adapter_config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "auto_mapping": {
3
+ "base_model_class": "MLP",
4
+ "parent_library": "test_regression"
5
+ },
6
+ "base_model_name_or_path": null,
7
+ "fan_in_fan_out": false,
8
+ "feedforward_modules": [
9
+ "lin0"
10
+ ],
11
+ "inference_mode": true,
12
+ "init_ia3_weights": false,
13
+ "modules_to_save": null,
14
+ "peft_type": "IA3",
15
+ "revision": null,
16
+ "target_modules": [
17
+ "lin0"
18
+ ],
19
+ "task_type": null
20
+ }
ia3_mlp/0.6.2/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f37cf4c827d5730fde053cc5e43926b7a329255bdf39a77b24d504d19ccda746
3
+ size 168
ia3_mlp/0.6.2/output.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d37ff05838c1628679f56a34b0e5c8e13f5cd9814216faa88d43a696dce9764
3
+ size 1239
ia3_no_ff_mlp/0.6.2/README.md ADDED
@@ -0,0 +1,206 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ ---
4
+
5
+ # Model Card for Model ID
6
+
7
+ <!-- Provide a quick summary of what the model is/does. -->
8
+
9
+
10
+
11
+ ## Model Details
12
+
13
+ ### Model Description
14
+
15
+ <!-- Provide a longer summary of what this model is. -->
16
+
17
+
18
+
19
+ - **Developed by:** [More Information Needed]
20
+ - **Shared by [optional]:** [More Information Needed]
21
+ - **Model type:** [More Information Needed]
22
+ - **Language(s) (NLP):** [More Information Needed]
23
+ - **License:** [More Information Needed]
24
+ - **Finetuned from model [optional]:** [More Information Needed]
25
+
26
+ ### Model Sources [optional]
27
+
28
+ <!-- Provide the basic links for the model. -->
29
+
30
+ - **Repository:** [More Information Needed]
31
+ - **Paper [optional]:** [More Information Needed]
32
+ - **Demo [optional]:** [More Information Needed]
33
+
34
+ ## Uses
35
+
36
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
37
+
38
+ ### Direct Use
39
+
40
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
41
+
42
+ [More Information Needed]
43
+
44
+ ### Downstream Use [optional]
45
+
46
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
47
+
48
+ [More Information Needed]
49
+
50
+ ### Out-of-Scope Use
51
+
52
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
53
+
54
+ [More Information Needed]
55
+
56
+ ## Bias, Risks, and Limitations
57
+
58
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
59
+
60
+ [More Information Needed]
61
+
62
+ ### Recommendations
63
+
64
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
65
+
66
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
67
+
68
+ ## How to Get Started with the Model
69
+
70
+ Use the code below to get started with the model.
71
+
72
+ [More Information Needed]
73
+
74
+ ## Training Details
75
+
76
+ ### Training Data
77
+
78
+ <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
79
+
80
+ [More Information Needed]
81
+
82
+ ### Training Procedure
83
+
84
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
85
+
86
+ #### Preprocessing [optional]
87
+
88
+ [More Information Needed]
89
+
90
+
91
+ #### Training Hyperparameters
92
+
93
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
94
+
95
+ #### Speeds, Sizes, Times [optional]
96
+
97
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
98
+
99
+ [More Information Needed]
100
+
101
+ ## Evaluation
102
+
103
+ <!-- This section describes the evaluation protocols and provides the results. -->
104
+
105
+ ### Testing Data, Factors & Metrics
106
+
107
+ #### Testing Data
108
+
109
+ <!-- This should link to a Data Card if possible. -->
110
+
111
+ [More Information Needed]
112
+
113
+ #### Factors
114
+
115
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
116
+
117
+ [More Information Needed]
118
+
119
+ #### Metrics
120
+
121
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
122
+
123
+ [More Information Needed]
124
+
125
+ ### Results
126
+
127
+ [More Information Needed]
128
+
129
+ #### Summary
130
+
131
+
132
+
133
+ ## Model Examination [optional]
134
+
135
+ <!-- Relevant interpretability work for the model goes here -->
136
+
137
+ [More Information Needed]
138
+
139
+ ## Environmental Impact
140
+
141
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
142
+
143
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
144
+
145
+ - **Hardware Type:** [More Information Needed]
146
+ - **Hours used:** [More Information Needed]
147
+ - **Cloud Provider:** [More Information Needed]
148
+ - **Compute Region:** [More Information Needed]
149
+ - **Carbon Emitted:** [More Information Needed]
150
+
151
+ ## Technical Specifications [optional]
152
+
153
+ ### Model Architecture and Objective
154
+
155
+ [More Information Needed]
156
+
157
+ ### Compute Infrastructure
158
+
159
+ [More Information Needed]
160
+
161
+ #### Hardware
162
+
163
+ [More Information Needed]
164
+
165
+ #### Software
166
+
167
+ [More Information Needed]
168
+
169
+ ## Citation [optional]
170
+
171
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
172
+
173
+ **BibTeX:**
174
+
175
+ [More Information Needed]
176
+
177
+ **APA:**
178
+
179
+ [More Information Needed]
180
+
181
+ ## Glossary [optional]
182
+
183
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
184
+
185
+ [More Information Needed]
186
+
187
+ ## More Information [optional]
188
+
189
+ [More Information Needed]
190
+
191
+ ## Model Card Authors [optional]
192
+
193
+ [More Information Needed]
194
+
195
+ ## Model Card Contact
196
+
197
+ [More Information Needed]
198
+
199
+
200
+ ## Training procedure
201
+
202
+
203
+ ### Framework versions
204
+
205
+
206
+ - PEFT 0.6.2
ia3_no_ff_mlp/0.6.2/adapter_config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "auto_mapping": {
3
+ "base_model_class": "MLP",
4
+ "parent_library": "test_regression"
5
+ },
6
+ "base_model_name_or_path": null,
7
+ "fan_in_fan_out": false,
8
+ "feedforward_modules": [],
9
+ "inference_mode": true,
10
+ "init_ia3_weights": false,
11
+ "modules_to_save": null,
12
+ "peft_type": "IA3",
13
+ "revision": null,
14
+ "target_modules": [
15
+ "lin0"
16
+ ],
17
+ "task_type": null
18
+ }
ia3_no_ff_mlp/0.6.2/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dd84ea77e8fe4df72057bd6b5a02c633dae2afa33b6d7286f2859c5dd53a8c0
3
+ size 208
ia3_no_ff_mlp/0.6.2/output.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6916d7bee023d39d11075986bb824a1569bffe25f855ddb956e95c56886a1164
3
+ size 1239
ia3_opt-350m/0.6.2/README.md ADDED
@@ -0,0 +1,207 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ base_model: facebook/opt-350m
4
+ ---
5
+
6
+ # Model Card for Model ID
7
+
8
+ <!-- Provide a quick summary of what the model is/does. -->
9
+
10
+
11
+
12
+ ## Model Details
13
+
14
+ ### Model Description
15
+
16
+ <!-- Provide a longer summary of what this model is. -->
17
+
18
+
19
+
20
+ - **Developed by:** [More Information Needed]
21
+ - **Shared by [optional]:** [More Information Needed]
22
+ - **Model type:** [More Information Needed]
23
+ - **Language(s) (NLP):** [More Information Needed]
24
+ - **License:** [More Information Needed]
25
+ - **Finetuned from model [optional]:** [More Information Needed]
26
+
27
+ ### Model Sources [optional]
28
+
29
+ <!-- Provide the basic links for the model. -->
30
+
31
+ - **Repository:** [More Information Needed]
32
+ - **Paper [optional]:** [More Information Needed]
33
+ - **Demo [optional]:** [More Information Needed]
34
+
35
+ ## Uses
36
+
37
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
38
+
39
+ ### Direct Use
40
+
41
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
42
+
43
+ [More Information Needed]
44
+
45
+ ### Downstream Use [optional]
46
+
47
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
48
+
49
+ [More Information Needed]
50
+
51
+ ### Out-of-Scope Use
52
+
53
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
54
+
55
+ [More Information Needed]
56
+
57
+ ## Bias, Risks, and Limitations
58
+
59
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
60
+
61
+ [More Information Needed]
62
+
63
+ ### Recommendations
64
+
65
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
66
+
67
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
68
+
69
+ ## How to Get Started with the Model
70
+
71
+ Use the code below to get started with the model.
72
+
73
+ [More Information Needed]
74
+
75
+ ## Training Details
76
+
77
+ ### Training Data
78
+
79
+ <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
80
+
81
+ [More Information Needed]
82
+
83
+ ### Training Procedure
84
+
85
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
86
+
87
+ #### Preprocessing [optional]
88
+
89
+ [More Information Needed]
90
+
91
+
92
+ #### Training Hyperparameters
93
+
94
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
95
+
96
+ #### Speeds, Sizes, Times [optional]
97
+
98
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
99
+
100
+ [More Information Needed]
101
+
102
+ ## Evaluation
103
+
104
+ <!-- This section describes the evaluation protocols and provides the results. -->
105
+
106
+ ### Testing Data, Factors & Metrics
107
+
108
+ #### Testing Data
109
+
110
+ <!-- This should link to a Data Card if possible. -->
111
+
112
+ [More Information Needed]
113
+
114
+ #### Factors
115
+
116
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
117
+
118
+ [More Information Needed]
119
+
120
+ #### Metrics
121
+
122
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
123
+
124
+ [More Information Needed]
125
+
126
+ ### Results
127
+
128
+ [More Information Needed]
129
+
130
+ #### Summary
131
+
132
+
133
+
134
+ ## Model Examination [optional]
135
+
136
+ <!-- Relevant interpretability work for the model goes here -->
137
+
138
+ [More Information Needed]
139
+
140
+ ## Environmental Impact
141
+
142
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
143
+
144
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
145
+
146
+ - **Hardware Type:** [More Information Needed]
147
+ - **Hours used:** [More Information Needed]
148
+ - **Cloud Provider:** [More Information Needed]
149
+ - **Compute Region:** [More Information Needed]
150
+ - **Carbon Emitted:** [More Information Needed]
151
+
152
+ ## Technical Specifications [optional]
153
+
154
+ ### Model Architecture and Objective
155
+
156
+ [More Information Needed]
157
+
158
+ ### Compute Infrastructure
159
+
160
+ [More Information Needed]
161
+
162
+ #### Hardware
163
+
164
+ [More Information Needed]
165
+
166
+ #### Software
167
+
168
+ [More Information Needed]
169
+
170
+ ## Citation [optional]
171
+
172
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
173
+
174
+ **BibTeX:**
175
+
176
+ [More Information Needed]
177
+
178
+ **APA:**
179
+
180
+ [More Information Needed]
181
+
182
+ ## Glossary [optional]
183
+
184
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
185
+
186
+ [More Information Needed]
187
+
188
+ ## More Information [optional]
189
+
190
+ [More Information Needed]
191
+
192
+ ## Model Card Authors [optional]
193
+
194
+ [More Information Needed]
195
+
196
+ ## Model Card Contact
197
+
198
+ [More Information Needed]
199
+
200
+
201
+ ## Training procedure
202
+
203
+
204
+ ### Framework versions
205
+
206
+
207
+ - PEFT 0.6.2
ia3_opt-350m/0.6.2/adapter_config.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "auto_mapping": {
3
+ "base_model_class": "OPTForCausalLM",
4
+ "parent_library": "transformers.models.opt.modeling_opt"
5
+ },
6
+ "base_model_name_or_path": "facebook/opt-350m",
7
+ "fan_in_fan_out": false,
8
+ "feedforward_modules": [
9
+ "fc2"
10
+ ],
11
+ "inference_mode": true,
12
+ "init_ia3_weights": false,
13
+ "modules_to_save": null,
14
+ "peft_type": "IA3",
15
+ "revision": null,
16
+ "target_modules": [
17
+ "q_proj",
18
+ "k_proj",
19
+ "fc2"
20
+ ],
21
+ "task_type": null
22
+ }
ia3_opt-350m/0.6.2/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7c93fe9f415a0f029daf4fd99656c672ad297586f1a82e61b0755a6861297c0
3
+ size 598856
ia3_opt-350m/0.6.2/output.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:227dde8197b0422d4f0e6633b0b2f678a8f2602959003db4528e15e2b6b393ee
3
+ size 1207639
lora_conv2d/0.6.2/README.md ADDED
@@ -0,0 +1,206 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ ---
4
+
5
+ # Model Card for Model ID
6
+
7
+ <!-- Provide a quick summary of what the model is/does. -->
8
+
9
+
10
+
11
+ ## Model Details
12
+
13
+ ### Model Description
14
+
15
+ <!-- Provide a longer summary of what this model is. -->
16
+
17
+
18
+
19
+ - **Developed by:** [More Information Needed]
20
+ - **Shared by [optional]:** [More Information Needed]
21
+ - **Model type:** [More Information Needed]
22
+ - **Language(s) (NLP):** [More Information Needed]
23
+ - **License:** [More Information Needed]
24
+ - **Finetuned from model [optional]:** [More Information Needed]
25
+
26
+ ### Model Sources [optional]
27
+
28
+ <!-- Provide the basic links for the model. -->
29
+
30
+ - **Repository:** [More Information Needed]
31
+ - **Paper [optional]:** [More Information Needed]
32
+ - **Demo [optional]:** [More Information Needed]
33
+
34
+ ## Uses
35
+
36
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
37
+
38
+ ### Direct Use
39
+
40
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
41
+
42
+ [More Information Needed]
43
+
44
+ ### Downstream Use [optional]
45
+
46
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
47
+
48
+ [More Information Needed]
49
+
50
+ ### Out-of-Scope Use
51
+
52
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
53
+
54
+ [More Information Needed]
55
+
56
+ ## Bias, Risks, and Limitations
57
+
58
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
59
+
60
+ [More Information Needed]
61
+
62
+ ### Recommendations
63
+
64
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
65
+
66
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
67
+
68
+ ## How to Get Started with the Model
69
+
70
+ Use the code below to get started with the model.
71
+
72
+ [More Information Needed]
73
+
74
+ ## Training Details
75
+
76
+ ### Training Data
77
+
78
+ <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
79
+
80
+ [More Information Needed]
81
+
82
+ ### Training Procedure
83
+
84
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
85
+
86
+ #### Preprocessing [optional]
87
+
88
+ [More Information Needed]
89
+
90
+
91
+ #### Training Hyperparameters
92
+
93
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
94
+
95
+ #### Speeds, Sizes, Times [optional]
96
+
97
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
98
+
99
+ [More Information Needed]
100
+
101
+ ## Evaluation
102
+
103
+ <!-- This section describes the evaluation protocols and provides the results. -->
104
+
105
+ ### Testing Data, Factors & Metrics
106
+
107
+ #### Testing Data
108
+
109
+ <!-- This should link to a Data Card if possible. -->
110
+
111
+ [More Information Needed]
112
+
113
+ #### Factors
114
+
115
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
116
+
117
+ [More Information Needed]
118
+
119
+ #### Metrics
120
+
121
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
122
+
123
+ [More Information Needed]
124
+
125
+ ### Results
126
+
127
+ [More Information Needed]
128
+
129
+ #### Summary
130
+
131
+
132
+
133
+ ## Model Examination [optional]
134
+
135
+ <!-- Relevant interpretability work for the model goes here -->
136
+
137
+ [More Information Needed]
138
+
139
+ ## Environmental Impact
140
+
141
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
142
+
143
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
144
+
145
+ - **Hardware Type:** [More Information Needed]
146
+ - **Hours used:** [More Information Needed]
147
+ - **Cloud Provider:** [More Information Needed]
148
+ - **Compute Region:** [More Information Needed]
149
+ - **Carbon Emitted:** [More Information Needed]
150
+
151
+ ## Technical Specifications [optional]
152
+
153
+ ### Model Architecture and Objective
154
+
155
+ [More Information Needed]
156
+
157
+ ### Compute Infrastructure
158
+
159
+ [More Information Needed]
160
+
161
+ #### Hardware
162
+
163
+ [More Information Needed]
164
+
165
+ #### Software
166
+
167
+ [More Information Needed]
168
+
169
+ ## Citation [optional]
170
+
171
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
172
+
173
+ **BibTeX:**
174
+
175
+ [More Information Needed]
176
+
177
+ **APA:**
178
+
179
+ [More Information Needed]
180
+
181
+ ## Glossary [optional]
182
+
183
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
184
+
185
+ [More Information Needed]
186
+
187
+ ## More Information [optional]
188
+
189
+ [More Information Needed]
190
+
191
+ ## Model Card Authors [optional]
192
+
193
+ [More Information Needed]
194
+
195
+ ## Model Card Contact
196
+
197
+ [More Information Needed]
198
+
199
+
200
+ ## Training procedure
201
+
202
+
203
+ ### Framework versions
204
+
205
+
206
+ - PEFT 0.6.2
lora_conv2d/0.6.2/adapter_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "ModelConv2D",
5
+ "parent_library": "test_regression"
6
+ },
7
+ "base_model_name_or_path": null,
8
+ "bias": "none",
9
+ "fan_in_fan_out": false,
10
+ "inference_mode": true,
11
+ "init_lora_weights": false,
12
+ "layers_pattern": null,
13
+ "layers_to_transform": null,
14
+ "lora_alpha": 8,
15
+ "lora_dropout": 0.0,
16
+ "modules_to_save": null,
17
+ "peft_type": "LORA",
18
+ "r": 8,
19
+ "rank_pattern": {},
20
+ "revision": null,
21
+ "target_modules": [
22
+ "conv2d"
23
+ ],
24
+ "task_type": null
25
+ }
lora_conv2d/0.6.2/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd9b1435a896564dff9bd097ac96ad1b330ab458a4d42fefb95f23a5e88d310e
3
+ size 2000
lora_conv2d/0.6.2/output.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1133f060fa4c33a00d693a12f1ce5da805a7a83b8d103b91d0b243b9cd0f2a22
3
+ size 1175
lora_emb_conv1d/0.6.2/README.md ADDED
@@ -0,0 +1,206 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ ---
4
+
5
+ # Model Card for Model ID
6
+
7
+ <!-- Provide a quick summary of what the model is/does. -->
8
+
9
+
10
+
11
+ ## Model Details
12
+
13
+ ### Model Description
14
+
15
+ <!-- Provide a longer summary of what this model is. -->
16
+
17
+
18
+
19
+ - **Developed by:** [More Information Needed]
20
+ - **Shared by [optional]:** [More Information Needed]
21
+ - **Model type:** [More Information Needed]
22
+ - **Language(s) (NLP):** [More Information Needed]
23
+ - **License:** [More Information Needed]
24
+ - **Finetuned from model [optional]:** [More Information Needed]
25
+
26
+ ### Model Sources [optional]
27
+
28
+ <!-- Provide the basic links for the model. -->
29
+
30
+ - **Repository:** [More Information Needed]
31
+ - **Paper [optional]:** [More Information Needed]
32
+ - **Demo [optional]:** [More Information Needed]
33
+
34
+ ## Uses
35
+
36
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
37
+
38
+ ### Direct Use
39
+
40
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
41
+
42
+ [More Information Needed]
43
+
44
+ ### Downstream Use [optional]
45
+
46
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
47
+
48
+ [More Information Needed]
49
+
50
+ ### Out-of-Scope Use
51
+
52
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
53
+
54
+ [More Information Needed]
55
+
56
+ ## Bias, Risks, and Limitations
57
+
58
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
59
+
60
+ [More Information Needed]
61
+
62
+ ### Recommendations
63
+
64
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
65
+
66
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
67
+
68
+ ## How to Get Started with the Model
69
+
70
+ Use the code below to get started with the model.
71
+
72
+ [More Information Needed]
73
+
74
+ ## Training Details
75
+
76
+ ### Training Data
77
+
78
+ <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
79
+
80
+ [More Information Needed]
81
+
82
+ ### Training Procedure
83
+
84
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
85
+
86
+ #### Preprocessing [optional]
87
+
88
+ [More Information Needed]
89
+
90
+
91
+ #### Training Hyperparameters
92
+
93
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
94
+
95
+ #### Speeds, Sizes, Times [optional]
96
+
97
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
98
+
99
+ [More Information Needed]
100
+
101
+ ## Evaluation
102
+
103
+ <!-- This section describes the evaluation protocols and provides the results. -->
104
+
105
+ ### Testing Data, Factors & Metrics
106
+
107
+ #### Testing Data
108
+
109
+ <!-- This should link to a Data Card if possible. -->
110
+
111
+ [More Information Needed]
112
+
113
+ #### Factors
114
+
115
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
116
+
117
+ [More Information Needed]
118
+
119
+ #### Metrics
120
+
121
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
122
+
123
+ [More Information Needed]
124
+
125
+ ### Results
126
+
127
+ [More Information Needed]
128
+
129
+ #### Summary
130
+
131
+
132
+
133
+ ## Model Examination [optional]
134
+
135
+ <!-- Relevant interpretability work for the model goes here -->
136
+
137
+ [More Information Needed]
138
+
139
+ ## Environmental Impact
140
+
141
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
142
+
143
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
144
+
145
+ - **Hardware Type:** [More Information Needed]
146
+ - **Hours used:** [More Information Needed]
147
+ - **Cloud Provider:** [More Information Needed]
148
+ - **Compute Region:** [More Information Needed]
149
+ - **Carbon Emitted:** [More Information Needed]
150
+
151
+ ## Technical Specifications [optional]
152
+
153
+ ### Model Architecture and Objective
154
+
155
+ [More Information Needed]
156
+
157
+ ### Compute Infrastructure
158
+
159
+ [More Information Needed]
160
+
161
+ #### Hardware
162
+
163
+ [More Information Needed]
164
+
165
+ #### Software
166
+
167
+ [More Information Needed]
168
+
169
+ ## Citation [optional]
170
+
171
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
172
+
173
+ **BibTeX:**
174
+
175
+ [More Information Needed]
176
+
177
+ **APA:**
178
+
179
+ [More Information Needed]
180
+
181
+ ## Glossary [optional]
182
+
183
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
184
+
185
+ [More Information Needed]
186
+
187
+ ## More Information [optional]
188
+
189
+ [More Information Needed]
190
+
191
+ ## Model Card Authors [optional]
192
+
193
+ [More Information Needed]
194
+
195
+ ## Model Card Contact
196
+
197
+ [More Information Needed]
198
+
199
+
200
+ ## Training procedure
201
+
202
+
203
+ ### Framework versions
204
+
205
+
206
+ - PEFT 0.6.2
lora_emb_conv1d/0.6.2/adapter_config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "ModelEmbConv1D",
5
+ "parent_library": "test_regression"
6
+ },
7
+ "base_model_name_or_path": null,
8
+ "bias": "none",
9
+ "fan_in_fan_out": true,
10
+ "inference_mode": true,
11
+ "init_lora_weights": false,
12
+ "layers_pattern": null,
13
+ "layers_to_transform": null,
14
+ "lora_alpha": 8,
15
+ "lora_dropout": 0.0,
16
+ "modules_to_save": null,
17
+ "peft_type": "LORA",
18
+ "r": 8,
19
+ "rank_pattern": {},
20
+ "revision": null,
21
+ "target_modules": [
22
+ "emb",
23
+ "conv1d"
24
+ ],
25
+ "task_type": null
26
+ }
lora_emb_conv1d/0.6.2/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d1b535c7c7b3338f55c6c5b085b61d353d2a413f258bf6c4c05d5c8e6e00534
3
+ size 3976
lora_emb_conv1d/0.6.2/output.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7587645064a53bf568a92ecbc0e5f6f90fe84aa46c35402287b5d7bae3b4a015
3
+ size 1239
lora_mlp/0.6.2/README.md ADDED
@@ -0,0 +1,206 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ ---
4
+
5
+ # Model Card for Model ID
6
+
7
+ <!-- Provide a quick summary of what the model is/does. -->
8
+
9
+
10
+
11
+ ## Model Details
12
+
13
+ ### Model Description
14
+
15
+ <!-- Provide a longer summary of what this model is. -->
16
+
17
+
18
+
19
+ - **Developed by:** [More Information Needed]
20
+ - **Shared by [optional]:** [More Information Needed]
21
+ - **Model type:** [More Information Needed]
22
+ - **Language(s) (NLP):** [More Information Needed]
23
+ - **License:** [More Information Needed]
24
+ - **Finetuned from model [optional]:** [More Information Needed]
25
+
26
+ ### Model Sources [optional]
27
+
28
+ <!-- Provide the basic links for the model. -->
29
+
30
+ - **Repository:** [More Information Needed]
31
+ - **Paper [optional]:** [More Information Needed]
32
+ - **Demo [optional]:** [More Information Needed]
33
+
34
+ ## Uses
35
+
36
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
37
+
38
+ ### Direct Use
39
+
40
+ <!-- This section covers use of the model without fine-tuning or plugging it into a larger ecosystem/app. -->
41
+
42
+ [More Information Needed]
43
+
44
+ ### Downstream Use [optional]
45
+
46
+ <!-- This section covers use of the model when it is fine-tuned for a task or plugged into a larger ecosystem/app. -->
47
+
48
+ [More Information Needed]
49
+
50
+ ### Out-of-Scope Use
51
+
52
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
53
+
54
+ [More Information Needed]
55
+
56
+ ## Bias, Risks, and Limitations
57
+
58
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
59
+
60
+ [More Information Needed]
61
+
62
+ ### Recommendations
63
+
64
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
65
+
66
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
67
+
68
+ ## How to Get Started with the Model
69
+
70
+ Use the code below to get started with the model.
71
+
72
+ [More Information Needed]
73
+
74
+ ## Training Details
75
+
76
+ ### Training Data
77
+
78
+ <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
79
+
80
+ [More Information Needed]
81
+
82
+ ### Training Procedure
83
+
84
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
85
+
86
+ #### Preprocessing [optional]
87
+
88
+ [More Information Needed]
89
+
90
+
91
+ #### Training Hyperparameters
92
+
93
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
94
+
95
+ #### Speeds, Sizes, Times [optional]
96
+
97
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
98
+
99
+ [More Information Needed]
100
+
101
+ ## Evaluation
102
+
103
+ <!-- This section describes the evaluation protocols and provides the results. -->
104
+
105
+ ### Testing Data, Factors & Metrics
106
+
107
+ #### Testing Data
108
+
109
+ <!-- This should link to a Data Card if possible. -->
110
+
111
+ [More Information Needed]
112
+
113
+ #### Factors
114
+
115
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
116
+
117
+ [More Information Needed]
118
+
119
+ #### Metrics
120
+
121
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
122
+
123
+ [More Information Needed]
124
+
125
+ ### Results
126
+
127
+ [More Information Needed]
128
+
129
+ #### Summary
130
+
131
+
132
+
133
+ ## Model Examination [optional]
134
+
135
+ <!-- Relevant interpretability work for the model goes here -->
136
+
137
+ [More Information Needed]
138
+
139
+ ## Environmental Impact
140
+
141
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
142
+
143
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
144
+
145
+ - **Hardware Type:** [More Information Needed]
146
+ - **Hours used:** [More Information Needed]
147
+ - **Cloud Provider:** [More Information Needed]
148
+ - **Compute Region:** [More Information Needed]
149
+ - **Carbon Emitted:** [More Information Needed]
150
+
151
+ ## Technical Specifications [optional]
152
+
153
+ ### Model Architecture and Objective
154
+
155
+ [More Information Needed]
156
+
157
+ ### Compute Infrastructure
158
+
159
+ [More Information Needed]
160
+
161
+ #### Hardware
162
+
163
+ [More Information Needed]
164
+
165
+ #### Software
166
+
167
+ [More Information Needed]
168
+
169
+ ## Citation [optional]
170
+
171
+ <!-- If there is a paper or blog post introducing the model, the APA and BibTeX information for it should go in this section. -->
172
+
173
+ **BibTeX:**
174
+
175
+ [More Information Needed]
176
+
177
+ **APA:**
178
+
179
+ [More Information Needed]
180
+
181
+ ## Glossary [optional]
182
+
183
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
184
+
185
+ [More Information Needed]
186
+
187
+ ## More Information [optional]
188
+
189
+ [More Information Needed]
190
+
191
+ ## Model Card Authors [optional]
192
+
193
+ [More Information Needed]
194
+
195
+ ## Model Card Contact
196
+
197
+ [More Information Needed]
198
+
199
+
200
+ ## Training procedure
201
+
202
+
203
+ ### Framework versions
204
+
205
+
206
+ - PEFT 0.6.2
lora_mlp/0.6.2/adapter_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "MLP",
5
+ "parent_library": "test_regression"
6
+ },
7
+ "base_model_name_or_path": null,
8
+ "bias": "none",
9
+ "fan_in_fan_out": false,
10
+ "inference_mode": true,
11
+ "init_lora_weights": false,
12
+ "layers_pattern": null,
13
+ "layers_to_transform": null,
14
+ "lora_alpha": 8,
15
+ "lora_dropout": 0.0,
16
+ "modules_to_save": null,
17
+ "peft_type": "LORA",
18
+ "r": 8,
19
+ "rank_pattern": {},
20
+ "revision": null,
21
+ "target_modules": [
22
+ "lin0"
23
+ ],
24
+ "task_type": null
25
+ }
lora_mlp/0.6.2/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dd16d2ccf171be88c29650a5780635f0418d21e8c74f7e4e919c3498e74d6a0
3
+ size 1192
lora_mlp/0.6.2/output.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50bcd27616ca78b6a55df1f21901d25ff81b4bcc4b8633e9de5456be9e76ede2
3
+ size 1239
lora_mlp_modules_to_save/0.6.2/README.md ADDED
@@ -0,0 +1,206 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ ---
4
+
5
+ # Model Card for Model ID
6
+
7
+ <!-- Provide a quick summary of what the model is/does. -->
8
+
9
+
10
+
11
+ ## Model Details
12
+
13
+ ### Model Description
14
+
15
+ <!-- Provide a longer summary of what this model is. -->
16
+
17
+
18
+
19
+ - **Developed by:** [More Information Needed]
20
+ - **Shared by [optional]:** [More Information Needed]
21
+ - **Model type:** [More Information Needed]
22
+ - **Language(s) (NLP):** [More Information Needed]
23
+ - **License:** [More Information Needed]
24
+ - **Finetuned from model [optional]:** [More Information Needed]
25
+
26
+ ### Model Sources [optional]
27
+
28
+ <!-- Provide the basic links for the model. -->
29
+
30
+ - **Repository:** [More Information Needed]
31
+ - **Paper [optional]:** [More Information Needed]
32
+ - **Demo [optional]:** [More Information Needed]
33
+
34
+ ## Uses
35
+
36
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
37
+
38
+ ### Direct Use
39
+
40
+ <!-- This section covers use of the model without fine-tuning or plugging it into a larger ecosystem/app. -->
41
+
42
+ [More Information Needed]
43
+
44
+ ### Downstream Use [optional]
45
+
46
+ <!-- This section covers use of the model when it is fine-tuned for a task or plugged into a larger ecosystem/app. -->
47
+
48
+ [More Information Needed]
49
+
50
+ ### Out-of-Scope Use
51
+
52
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
53
+
54
+ [More Information Needed]
55
+
56
+ ## Bias, Risks, and Limitations
57
+
58
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
59
+
60
+ [More Information Needed]
61
+
62
+ ### Recommendations
63
+
64
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
65
+
66
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
67
+
68
+ ## How to Get Started with the Model
69
+
70
+ Use the code below to get started with the model.
71
+
72
+ [More Information Needed]
73
+
74
+ ## Training Details
75
+
76
+ ### Training Data
77
+
78
+ <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
79
+
80
+ [More Information Needed]
81
+
82
+ ### Training Procedure
83
+
84
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
85
+
86
+ #### Preprocessing [optional]
87
+
88
+ [More Information Needed]
89
+
90
+
91
+ #### Training Hyperparameters
92
+
93
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
94
+
95
+ #### Speeds, Sizes, Times [optional]
96
+
97
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
98
+
99
+ [More Information Needed]
100
+
101
+ ## Evaluation
102
+
103
+ <!-- This section describes the evaluation protocols and provides the results. -->
104
+
105
+ ### Testing Data, Factors & Metrics
106
+
107
+ #### Testing Data
108
+
109
+ <!-- This should link to a Data Card if possible. -->
110
+
111
+ [More Information Needed]
112
+
113
+ #### Factors
114
+
115
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
116
+
117
+ [More Information Needed]
118
+
119
+ #### Metrics
120
+
121
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
122
+
123
+ [More Information Needed]
124
+
125
+ ### Results
126
+
127
+ [More Information Needed]
128
+
129
+ #### Summary
130
+
131
+
132
+
133
+ ## Model Examination [optional]
134
+
135
+ <!-- Relevant interpretability work for the model goes here -->
136
+
137
+ [More Information Needed]
138
+
139
+ ## Environmental Impact
140
+
141
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
142
+
143
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
144
+
145
+ - **Hardware Type:** [More Information Needed]
146
+ - **Hours used:** [More Information Needed]
147
+ - **Cloud Provider:** [More Information Needed]
148
+ - **Compute Region:** [More Information Needed]
149
+ - **Carbon Emitted:** [More Information Needed]
150
+
151
+ ## Technical Specifications [optional]
152
+
153
+ ### Model Architecture and Objective
154
+
155
+ [More Information Needed]
156
+
157
+ ### Compute Infrastructure
158
+
159
+ [More Information Needed]
160
+
161
+ #### Hardware
162
+
163
+ [More Information Needed]
164
+
165
+ #### Software
166
+
167
+ [More Information Needed]
168
+
169
+ ## Citation [optional]
170
+
171
+ <!-- If there is a paper or blog post introducing the model, the APA and BibTeX information for it should go in this section. -->
172
+
173
+ **BibTeX:**
174
+
175
+ [More Information Needed]
176
+
177
+ **APA:**
178
+
179
+ [More Information Needed]
180
+
181
+ ## Glossary [optional]
182
+
183
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
184
+
185
+ [More Information Needed]
186
+
187
+ ## More Information [optional]
188
+
189
+ [More Information Needed]
190
+
191
+ ## Model Card Authors [optional]
192
+
193
+ [More Information Needed]
194
+
195
+ ## Model Card Contact
196
+
197
+ [More Information Needed]
198
+
199
+
200
+ ## Training procedure
201
+
202
+
203
+ ### Framework versions
204
+
205
+
206
+ - PEFT 0.6.2
lora_mlp_modules_to_save/0.6.2/adapter_config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "MLP",
5
+ "parent_library": "test_regression"
6
+ },
7
+ "base_model_name_or_path": null,
8
+ "bias": "none",
9
+ "fan_in_fan_out": false,
10
+ "inference_mode": true,
11
+ "init_lora_weights": false,
12
+ "layers_pattern": null,
13
+ "layers_to_transform": null,
14
+ "lora_alpha": 8,
15
+ "lora_dropout": 0.0,
16
+ "modules_to_save": [
17
+ "lin1"
18
+ ],
19
+ "peft_type": "LORA",
20
+ "r": 8,
21
+ "rank_pattern": {},
22
+ "revision": null,
23
+ "target_modules": [
24
+ "lin0"
25
+ ],
26
+ "task_type": null
27
+ }
lora_mlp_modules_to_save/0.6.2/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c1939cb8cb41a8bb5f05238d37aa77d18d96d1d7a9d3afa6d6ff2d2ef9805ea
3
+ size 1528
lora_mlp_modules_to_save/0.6.2/output.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50bcd27616ca78b6a55df1f21901d25ff81b4bcc4b8633e9de5456be9e76ede2
3
+ size 1239
lora_opt-350m/0.6.2/README.md ADDED
@@ -0,0 +1,207 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ base_model: facebook/opt-350m
4
+ ---
5
+
6
+ # Model Card for Model ID
7
+
8
+ <!-- Provide a quick summary of what the model is/does. -->
9
+
10
+
11
+
12
+ ## Model Details
13
+
14
+ ### Model Description
15
+
16
+ <!-- Provide a longer summary of what this model is. -->
17
+
18
+
19
+
20
+ - **Developed by:** [More Information Needed]
21
+ - **Shared by [optional]:** [More Information Needed]
22
+ - **Model type:** [More Information Needed]
23
+ - **Language(s) (NLP):** [More Information Needed]
24
+ - **License:** [More Information Needed]
25
+ - **Finetuned from model [optional]:** [More Information Needed]
26
+
27
+ ### Model Sources [optional]
28
+
29
+ <!-- Provide the basic links for the model. -->
30
+
31
+ - **Repository:** [More Information Needed]
32
+ - **Paper [optional]:** [More Information Needed]
33
+ - **Demo [optional]:** [More Information Needed]
34
+
35
+ ## Uses
36
+
37
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
38
+
39
+ ### Direct Use
40
+
41
+ <!-- This section covers use of the model without fine-tuning or plugging it into a larger ecosystem/app. -->
42
+
43
+ [More Information Needed]
44
+
45
+ ### Downstream Use [optional]
46
+
47
+ <!-- This section covers use of the model when it is fine-tuned for a task or plugged into a larger ecosystem/app. -->
48
+
49
+ [More Information Needed]
50
+
51
+ ### Out-of-Scope Use
52
+
53
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
54
+
55
+ [More Information Needed]
56
+
57
+ ## Bias, Risks, and Limitations
58
+
59
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
60
+
61
+ [More Information Needed]
62
+
63
+ ### Recommendations
64
+
65
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
66
+
67
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
68
+
69
+ ## How to Get Started with the Model
70
+
71
+ Use the code below to get started with the model.
72
+
73
+ [More Information Needed]
74
+
75
+ ## Training Details
76
+
77
+ ### Training Data
78
+
79
+ <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
80
+
81
+ [More Information Needed]
82
+
83
+ ### Training Procedure
84
+
85
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
86
+
87
+ #### Preprocessing [optional]
88
+
89
+ [More Information Needed]
90
+
91
+
92
+ #### Training Hyperparameters
93
+
94
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
95
+
96
+ #### Speeds, Sizes, Times [optional]
97
+
98
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
99
+
100
+ [More Information Needed]
101
+
102
+ ## Evaluation
103
+
104
+ <!-- This section describes the evaluation protocols and provides the results. -->
105
+
106
+ ### Testing Data, Factors & Metrics
107
+
108
+ #### Testing Data
109
+
110
+ <!-- This should link to a Data Card if possible. -->
111
+
112
+ [More Information Needed]
113
+
114
+ #### Factors
115
+
116
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
117
+
118
+ [More Information Needed]
119
+
120
+ #### Metrics
121
+
122
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
123
+
124
+ [More Information Needed]
125
+
126
+ ### Results
127
+
128
+ [More Information Needed]
129
+
130
+ #### Summary
131
+
132
+
133
+
134
+ ## Model Examination [optional]
135
+
136
+ <!-- Relevant interpretability work for the model goes here -->
137
+
138
+ [More Information Needed]
139
+
140
+ ## Environmental Impact
141
+
142
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
143
+
144
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
145
+
146
+ - **Hardware Type:** [More Information Needed]
147
+ - **Hours used:** [More Information Needed]
148
+ - **Cloud Provider:** [More Information Needed]
149
+ - **Compute Region:** [More Information Needed]
150
+ - **Carbon Emitted:** [More Information Needed]
151
+
152
+ ## Technical Specifications [optional]
153
+
154
+ ### Model Architecture and Objective
155
+
156
+ [More Information Needed]
157
+
158
+ ### Compute Infrastructure
159
+
160
+ [More Information Needed]
161
+
162
+ #### Hardware
163
+
164
+ [More Information Needed]
165
+
166
+ #### Software
167
+
168
+ [More Information Needed]
169
+
170
+ ## Citation [optional]
171
+
172
+ <!-- If there is a paper or blog post introducing the model, the APA and BibTeX information for it should go in this section. -->
173
+
174
+ **BibTeX:**
175
+
176
+ [More Information Needed]
177
+
178
+ **APA:**
179
+
180
+ [More Information Needed]
181
+
182
+ ## Glossary [optional]
183
+
184
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
185
+
186
+ [More Information Needed]
187
+
188
+ ## More Information [optional]
189
+
190
+ [More Information Needed]
191
+
192
+ ## Model Card Authors [optional]
193
+
194
+ [More Information Needed]
195
+
196
+ ## Model Card Contact
197
+
198
+ [More Information Needed]
199
+
200
+
201
+ ## Training procedure
202
+
203
+
204
+ ### Framework versions
205
+
206
+
207
+ - PEFT 0.6.2
lora_opt-350m/0.6.2/adapter_config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "OPTForCausalLM",
5
+ "parent_library": "transformers.models.opt.modeling_opt"
6
+ },
7
+ "base_model_name_or_path": "facebook/opt-350m",
8
+ "bias": "none",
9
+ "fan_in_fan_out": false,
10
+ "inference_mode": true,
11
+ "init_lora_weights": false,
12
+ "layers_pattern": null,
13
+ "layers_to_transform": null,
14
+ "lora_alpha": 8,
15
+ "lora_dropout": 0.0,
16
+ "modules_to_save": null,
17
+ "peft_type": "LORA",
18
+ "r": 8,
19
+ "rank_pattern": {},
20
+ "revision": null,
21
+ "target_modules": [
22
+ "q_proj",
23
+ "v_proj"
24
+ ],
25
+ "task_type": null
26
+ }
lora_opt-350m/0.6.2/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82751e30bebc19cbfa01212631d08c7032fc3a75996dadf4da1d29298fdd736f
3
+ size 3159096
lora_opt-350m/0.6.2/output.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:788d8589a3e462ff482ff8926366f18b4bcf9c1d6af2bb1158eff483668645ef
3
+ size 1207639
lora_opt-350m_bnb_4bit/0.6.2/README.md ADDED
@@ -0,0 +1,219 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ base_model: facebook/opt-350m
4
+ ---
5
+
6
+ # Model Card for Model ID
7
+
8
+ <!-- Provide a quick summary of what the model is/does. -->
9
+
10
+
11
+
12
+ ## Model Details
13
+
14
+ ### Model Description
15
+
16
+ <!-- Provide a longer summary of what this model is. -->
17
+
18
+
19
+
20
+ - **Developed by:** [More Information Needed]
21
+ - **Shared by [optional]:** [More Information Needed]
22
+ - **Model type:** [More Information Needed]
23
+ - **Language(s) (NLP):** [More Information Needed]
24
+ - **License:** [More Information Needed]
25
+ - **Finetuned from model [optional]:** [More Information Needed]
26
+
27
+ ### Model Sources [optional]
28
+
29
+ <!-- Provide the basic links for the model. -->
30
+
31
+ - **Repository:** [More Information Needed]
32
+ - **Paper [optional]:** [More Information Needed]
33
+ - **Demo [optional]:** [More Information Needed]
34
+
35
+ ## Uses
36
+
37
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
38
+
39
+ ### Direct Use
40
+
41
+ <!-- This section covers use of the model without fine-tuning or plugging it into a larger ecosystem/app. -->
42
+
43
+ [More Information Needed]
44
+
45
+ ### Downstream Use [optional]
46
+
47
+ <!-- This section covers use of the model when it is fine-tuned for a task or plugged into a larger ecosystem/app. -->
48
+
49
+ [More Information Needed]
50
+
51
+ ### Out-of-Scope Use
52
+
53
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
54
+
55
+ [More Information Needed]
56
+
57
+ ## Bias, Risks, and Limitations
58
+
59
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
60
+
61
+ [More Information Needed]
62
+
63
+ ### Recommendations
64
+
65
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
66
+
67
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
68
+
69
+ ## How to Get Started with the Model
70
+
71
+ Use the code below to get started with the model.
72
+
73
+ [More Information Needed]
74
+
75
+ ## Training Details
76
+
77
+ ### Training Data
78
+
79
+ <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
80
+
81
+ [More Information Needed]
82
+
83
+ ### Training Procedure
84
+
85
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
86
+
87
+ #### Preprocessing [optional]
88
+
89
+ [More Information Needed]
90
+
91
+
92
+ #### Training Hyperparameters
93
+
94
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
95
+
96
+ #### Speeds, Sizes, Times [optional]
97
+
98
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
99
+
100
+ [More Information Needed]
101
+
102
+ ## Evaluation
103
+
104
+ <!-- This section describes the evaluation protocols and provides the results. -->
105
+
106
+ ### Testing Data, Factors & Metrics
107
+
108
+ #### Testing Data
109
+
110
+ <!-- This should link to a Data Card if possible. -->
111
+
112
+ [More Information Needed]
113
+
114
+ #### Factors
115
+
116
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
117
+
118
+ [More Information Needed]
119
+
120
+ #### Metrics
121
+
122
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
123
+
124
+ [More Information Needed]
125
+
126
+ ### Results
127
+
128
+ [More Information Needed]
129
+
130
+ #### Summary
131
+
132
+
133
+
134
+ ## Model Examination [optional]
135
+
136
+ <!-- Relevant interpretability work for the model goes here -->
137
+
138
+ [More Information Needed]
139
+
140
+ ## Environmental Impact
141
+
142
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
143
+
144
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
145
+
146
+ - **Hardware Type:** [More Information Needed]
147
+ - **Hours used:** [More Information Needed]
148
+ - **Cloud Provider:** [More Information Needed]
149
+ - **Compute Region:** [More Information Needed]
150
+ - **Carbon Emitted:** [More Information Needed]
151
+
152
+ ## Technical Specifications [optional]
153
+
154
+ ### Model Architecture and Objective
155
+
156
+ [More Information Needed]
157
+
158
+ ### Compute Infrastructure
159
+
160
+ [More Information Needed]
161
+
162
+ #### Hardware
163
+
164
+ [More Information Needed]
165
+
166
+ #### Software
167
+
168
+ [More Information Needed]
169
+
170
+ ## Citation [optional]
171
+
172
+ <!-- If there is a paper or blog post introducing the model, the APA and BibTeX information for it should go in this section. -->
173
+
174
+ **BibTeX:**
175
+
176
+ [More Information Needed]
177
+
178
+ **APA:**
179
+
180
+ [More Information Needed]
181
+
182
+ ## Glossary [optional]
183
+
184
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
185
+
186
+ [More Information Needed]
187
+
188
+ ## More Information [optional]
189
+
190
+ [More Information Needed]
191
+
192
+ ## Model Card Authors [optional]
193
+
194
+ [More Information Needed]
195
+
196
+ ## Model Card Contact
197
+
198
+ [More Information Needed]
199
+
200
+
201
+ ## Training procedure
202
+
203
+
204
+ The following `bitsandbytes` quantization config was used during training:
205
+ - quant_method: bitsandbytes
206
+ - load_in_8bit: False
207
+ - load_in_4bit: True
208
+ - llm_int8_threshold: 6.0
209
+ - llm_int8_skip_modules: None
210
+ - llm_int8_enable_fp32_cpu_offload: False
211
+ - llm_int8_has_fp16_weight: False
212
+ - bnb_4bit_quant_type: fp4
213
+ - bnb_4bit_use_double_quant: False
214
+ - bnb_4bit_compute_dtype: float32
215
+
216
+ ### Framework versions
217
+
218
+
219
+ - PEFT 0.6.2
lora_opt-350m_bnb_4bit/0.6.2/adapter_config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "OPTForCausalLM",
5
+ "parent_library": "transformers.models.opt.modeling_opt"
6
+ },
7
+ "base_model_name_or_path": "facebook/opt-350m",
8
+ "bias": "none",
9
+ "fan_in_fan_out": false,
10
+ "inference_mode": true,
11
+ "init_lora_weights": false,
12
+ "layers_pattern": null,
13
+ "layers_to_transform": null,
14
+ "lora_alpha": 8,
15
+ "lora_dropout": 0.0,
16
+ "modules_to_save": null,
17
+ "peft_type": "LORA",
18
+ "r": 8,
19
+ "rank_pattern": {},
20
+ "revision": null,
21
+ "target_modules": [
22
+ "q_proj",
23
+ "v_proj"
24
+ ],
25
+ "task_type": null
26
+ }
lora_opt-350m_bnb_4bit/0.6.2/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ece009e7ac28447a45cef4a37c5a4a0048b5a5b12261e37464fa762771b94a86
3
+ size 3159096
lora_opt-350m_bnb_4bit/0.6.2/output.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00942ada33ef2fcbe9621268e1cce8c59aeeb71dd1c79101498d00c1881f07f5
3
+ size 1207639
lora_opt-350m_bnb_8bit/0.6.2/README.md ADDED
@@ -0,0 +1,219 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ base_model: facebook/opt-350m
4
+ ---
5
+
6
+ # Model Card for Model ID
7
+
8
+ <!-- Provide a quick summary of what the model is/does. -->
9
+
10
+
11
+
12
+ ## Model Details
13
+
14
+ ### Model Description
15
+
16
+ <!-- Provide a longer summary of what this model is. -->
17
+
18
+
19
+
20
+ - **Developed by:** [More Information Needed]
21
+ - **Shared by [optional]:** [More Information Needed]
22
+ - **Model type:** [More Information Needed]
23
+ - **Language(s) (NLP):** [More Information Needed]
24
+ - **License:** [More Information Needed]
25
+ - **Finetuned from model [optional]:** [More Information Needed]
26
+
27
+ ### Model Sources [optional]
28
+
29
+ <!-- Provide the basic links for the model. -->
30
+
31
+ - **Repository:** [More Information Needed]
32
+ - **Paper [optional]:** [More Information Needed]
33
+ - **Demo [optional]:** [More Information Needed]
34
+
35
+ ## Uses
36
+
37
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
38
+
39
+ ### Direct Use
40
+
41
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
42
+
43
+ [More Information Needed]
44
+
45
+ ### Downstream Use [optional]
46
+
47
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app. -->
48
+
49
+ [More Information Needed]
50
+
51
+ ### Out-of-Scope Use
52
+
53
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
54
+
55
+ [More Information Needed]
56
+
57
+ ## Bias, Risks, and Limitations
58
+
59
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
60
+
61
+ [More Information Needed]
62
+
63
+ ### Recommendations
64
+
65
+ <!-- This section is meant to convey recommendations with respect to the biases, risks, and technical limitations. -->
66
+
67
+ Users (both direct and downstream) should be made aware of the risks, biases, and limitations of the model. More information is needed for further recommendations.
68
+
69
+ ## How to Get Started with the Model
70
+
71
+ Use the code below to get started with the model.
72
+
73
+ [More Information Needed]
74
+
75
+ ## Training Details
76
+
77
+ ### Training Data
78
+
79
+ <!-- This should link to a Data Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
80
+
81
+ [More Information Needed]
82
+
83
+ ### Training Procedure
84
+
85
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
86
+
87
+ #### Preprocessing [optional]
88
+
89
+ [More Information Needed]
90
+
91
+
92
+ #### Training Hyperparameters
93
+
94
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
95
+
96
+ #### Speeds, Sizes, Times [optional]
97
+
98
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
99
+
100
+ [More Information Needed]
101
+
102
+ ## Evaluation
103
+
104
+ <!-- This section describes the evaluation protocols and provides the results. -->
105
+
106
+ ### Testing Data, Factors & Metrics
107
+
108
+ #### Testing Data
109
+
110
+ <!-- This should link to a Data Card if possible. -->
111
+
112
+ [More Information Needed]
113
+
114
+ #### Factors
115
+
116
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
117
+
118
+ [More Information Needed]
119
+
120
+ #### Metrics
121
+
122
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
123
+
124
+ [More Information Needed]
125
+
126
+ ### Results
127
+
128
+ [More Information Needed]
129
+
130
+ #### Summary
131
+
132
+
133
+
134
+ ## Model Examination [optional]
135
+
136
+ <!-- Relevant interpretability work for the model goes here -->
137
+
138
+ [More Information Needed]
139
+
140
+ ## Environmental Impact
141
+
142
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly. -->
143
+
144
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
145
+
146
+ - **Hardware Type:** [More Information Needed]
147
+ - **Hours used:** [More Information Needed]
148
+ - **Cloud Provider:** [More Information Needed]
149
+ - **Compute Region:** [More Information Needed]
150
+ - **Carbon Emitted:** [More Information Needed]
151
+
152
+ ## Technical Specifications [optional]
153
+
154
+ ### Model Architecture and Objective
155
+
156
+ [More Information Needed]
157
+
158
+ ### Compute Infrastructure
159
+
160
+ [More Information Needed]
161
+
162
+ #### Hardware
163
+
164
+ [More Information Needed]
165
+
166
+ #### Software
167
+
168
+ [More Information Needed]
169
+
170
+ ## Citation [optional]
171
+
172
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
173
+
174
+ **BibTeX:**
175
+
176
+ [More Information Needed]
177
+
178
+ **APA:**
179
+
180
+ [More Information Needed]
181
+
182
+ ## Glossary [optional]
183
+
184
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
185
+
186
+ [More Information Needed]
187
+
188
+ ## More Information [optional]
189
+
190
+ [More Information Needed]
191
+
192
+ ## Model Card Authors [optional]
193
+
194
+ [More Information Needed]
195
+
196
+ ## Model Card Contact
197
+
198
+ [More Information Needed]
199
+
200
+
201
+ ## Training procedure
202
+
203
+
204
+ The following `bitsandbytes` quantization config was used during training:
205
+ - quant_method: bitsandbytes
206
+ - load_in_8bit: True
207
+ - load_in_4bit: False
208
+ - llm_int8_threshold: 6.0
209
+ - llm_int8_skip_modules: None
210
+ - llm_int8_enable_fp32_cpu_offload: False
211
+ - llm_int8_has_fp16_weight: False
212
+ - bnb_4bit_quant_type: fp4
213
+ - bnb_4bit_use_double_quant: False
214
+ - bnb_4bit_compute_dtype: float32
215
+
216
+ ### Framework versions
217
+
218
+
219
+ - PEFT 0.6.2
lora_opt-350m_bnb_8bit/0.6.2/adapter_config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "OPTForCausalLM",
5
+ "parent_library": "transformers.models.opt.modeling_opt"
6
+ },
7
+ "base_model_name_or_path": "facebook/opt-350m",
8
+ "bias": "none",
9
+ "fan_in_fan_out": false,
10
+ "inference_mode": true,
11
+ "init_lora_weights": false,
12
+ "layers_pattern": null,
13
+ "layers_to_transform": null,
14
+ "lora_alpha": 8,
15
+ "lora_dropout": 0.0,
16
+ "modules_to_save": null,
17
+ "peft_type": "LORA",
18
+ "r": 8,
19
+ "rank_pattern": {},
20
+ "revision": null,
21
+ "target_modules": [
22
+ "q_proj",
23
+ "v_proj"
24
+ ],
25
+ "task_type": null
26
+ }