cedricwhitney committed on
Commit
f0d479a
•
1 Parent(s): 57937bf

Create smolVLM

Browse files
Files changed (1) hide show
  1. model_data/smolVLM +374 -0
model_data/smolVLM ADDED
@@ -0,0 +1,374 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "metadata": {
3
+ "Name": "SmolVLM",
4
+ "Provider": "Hugging Face",
5
+ "URL": "https://huggingface.co/HuggingFaceTB/SmolVLM",
6
+ "Type": "Vision-Language Model",
7
+ "Modalities": [
8
+ "Text-to-Text",
9
+ "Image-to-Text"
10
+ ]
11
+ },
12
+ "scores": {
13
+ "1. Bias, Stereotypes, and Representational Harms Evaluation": {
14
+ "1.1 Bias Detection Overview": {
15
+ "status": "No",
16
+ "sources": [],
17
+ "questions": {
18
+ "Evaluations at various stages (data collection, preprocessing, AI system architecture, training, deployment)": false,
19
+ "Have intrinsic properties of the AI system been evaluated for bias (e.g., embedding analysis)": false,
20
+ "Have extrinsic bias evaluations been run (e.g., downstream task performance)": false,
21
+ "Have evaluations been run across all applicable modalities": false,
22
+ "Have bias evaluations been run that take the form of automatic quantitative evaluation": false,
23
+ "Have bias evaluations been run with human participants?": false
24
+ }
25
+ },
26
+ "1.2 Protected Classes and Intersectional Measures": {
27
+ "status": "No",
28
+ "sources": [],
29
+ "questions": {
30
+ "Do evaluations cover all applicable legal protected categories for in-scope uses of the system?": false,
31
+ "Do evaluations cover additional subgroups that are likely to be harmed based on other personal characteristics": false,
32
+ "Evaluation of how different aspects of identity interact and compound in AI system behavior": false,
33
+ "Evaluation of AI system biases for legal protected categories and additional relevant subgroups": false
34
+ }
35
+ },
36
+ "1.3 Measurement of Stereotypes and Harmful Associations": {
37
+ "status": "No",
38
+ "sources": [],
39
+ "questions": {
40
+ "Measurement of known stereotypes in AI system outputs": false,
41
+ "Measurement of other negative associations and assumptions regarding specific groups": false,
42
+ "Measurement of stereotypes and negative associations across in-scope contexts": false
43
+ }
44
+ },
45
+ "1.4 Bias Evaluation Transparency and Documentation": {
46
+ "status": "No",
47
+ "sources": [],
48
+ "questions": {
49
+ "Sufficient documentation of evaluation method to understand the scope of the findings": false,
50
+ "Sufficient documentation of evaluation methods to replicate findings": false,
51
+ "Sufficient documentation of evaluation results to support comparison": false,
52
+ "Documentation of bias mitigation measures": false,
53
+ "Documentation of bias monitoring approaches": false
54
+ }
55
+ }
56
+ },
57
+ "2. Cultural Values and Sensitive Content Evaluation": {
58
+ "2.1 Cultural Variation Overview": {
59
+ "status": "No",
60
+ "sources": [],
61
+ "questions": {
62
+ "Evaluations at various stages": false,
63
+ "Have intrinsic properties been evaluated for cultural variation": false,
64
+ "Have extrinsic cultural variation evaluations been run": false,
65
+ "Have evaluations been run across all applicable modalities": false,
66
+ "Have cultural variation evaluations been run that take the form of automatic quantitative evaluation": false,
67
+ "Have cultural variation evaluations been run with human participants?": false
68
+ }
69
+ },
70
+ "2.2 Cultural Diversity and Representation": {
71
+ "status": "No",
72
+ "sources": [],
73
+ "questions": {
74
+ "Use of evaluation methods developed in the cultural contexts in scope": false,
75
+ "Respect of indigenous sovereignty, protected rights, and cultural norms": false,
76
+ "Evaluation of cultural variation across geographic dimensions": false,
77
+ "Evaluation of cultural variation representing communities' perspectives": false,
78
+ "Analysis of how cultural context affects AI system performance": false
79
+ }
80
+ },
81
+ "2.3 Generated Sensitive Content across Cultural Contexts": {
82
+ "status": "No",
83
+ "sources": [],
84
+ "questions": {
85
+ "Has the AI system been evaluated for its likelihood of facilitating generation of threatening or violent content": false,
86
+ "Has the AI system been evaluated for its likelihood of facilitating generation of targeted harassment or discrimination": false,
87
+ "Has the AI system been evaluated for its likelihood of facilitating generation of hate speech": false,
88
+ "Has the AI system been evaluated for content embedding values not reflective of user cultural context": false,
89
+ "Has the AI system been evaluated for exposing users to inappropriate content": false,
90
+ "Has the AI system been evaluated for content with negative psychological impacts": false,
91
+ "Has the evaluation explicitly addressed cultural variation": false
92
+ }
93
+ },
94
+ "2.4 Cultural Variation Transparency and Documentation": {
95
+ "status": "No",
96
+ "sources": [],
97
+ "questions": {
98
+ "Documentation of cultural contexts considered during development": false,
99
+ "Documentation of cultural contexts covered by evaluations": false,
100
+ "Sufficient documentation of evaluation method": false,
101
+ "Sufficient documentation of evaluation methods to replicate findings": false,
102
+ "Sufficient documentation of evaluation results": false,
103
+ "Documentation of psychological impact on evaluators": false,
104
+ "Documentation of evaluator well-being measures": false
105
+ }
106
+ }
107
+ },
108
+ "3. Disparate Performance": {
109
+ "3.1 Disparate Performance Overview": {
110
+ "status": "N/A",
111
+ "sources": [],
112
+ "questions": {
113
+ "Have development choices been evaluated for disparate performance contribution": false,
114
+ "Have extrinsic disparate performance evaluations been run": false,
115
+ "Have evaluations been run across all applicable modalities": false,
116
+ "Have disparate performance evaluations been run quantitatively": false,
117
+ "Have disparate performance evaluations been run with human participants": false
118
+ }
119
+ },
120
+ "3.2 Identifying Target Groups": {
121
+ "status": "N/A",
122
+ "sources": [],
123
+ "questions": {
124
+ "Identification of mandated target groups": false,
125
+ "Identification of additional potentially harmed groups": false,
126
+ "Assessment of systemic barriers in data collection": false,
127
+ "Consideration of historical disparities": false,
128
+ "Identification of implicit and explicit markers": false
129
+ }
130
+ },
131
+ "3.3 Subgroup Performance Analysis": {
132
+ "status": "N/A",
133
+ "sources": [],
134
+ "questions": {
135
+ "Non-aggregated evaluation results across subpopulations": false,
136
+ "Metrics for decision-making tasks": false,
137
+ "Metrics for other tasks including generative": false,
138
+ "Worst-case subgroup performance analysis": false,
139
+ "Intersectional analysis": false,
140
+ "Evaluation of implicit social group markers": false
141
+ }
142
+ },
143
+ "3.4 Transparency and Documentation": {
144
+ "status": "N/A",
145
+ "sources": [],
146
+ "questions": {
147
+ "Documentation of evaluation method scope": false,
148
+ "Documentation of evaluation methods for replication": false,
149
+ "Documentation of evaluation results for comparison": false,
150
+ "Documentation of mitigation measures": false,
151
+ "Documentation of monitoring approaches": false
152
+ }
153
+ }
154
+ },
155
+ "4. Environmental Costs and Carbon Emissions Evaluation": {
156
+ "4.1 Environmental Costs Overview": {
157
+ "status": "Yes",
158
+ "sources": [
159
+ {
160
+ "type": "🌐",
161
+ "detail": "https://huggingface.co/HuggingFaceTB/SmolVLM-Instruct",
162
+ "name": "Model Card"
163
+ }
164
+ ],
165
+ "questions": {
166
+ "Evaluations of different processes": false,
167
+ "Have evaluations been run across all applicable modalities?": true,
168
+ "Have evaluations been run on standardized benchmarks or metrics?": true,
169
+ "Have evaluations taken into account community feedback": false,
170
+ "Do evaluations consider the full supply chain": false
171
+ }
172
+ },
173
+ "4.2 Energy Cost and Environmental Impact of Development": {
174
+ "status": "Yes",
175
+ "sources": [
176
+ {
177
+ "type": "🌐",
178
+ "detail": "https://huggingface.co/HuggingFaceTB/SmolVLM-Instruct",
179
+ "name": "Model Card"
180
+ }
181
+ ],
182
+ "questions": {
183
+ "Accounting of FLOPS across development stages": true,
184
+ "Evaluation of energy consumption using standardized tracking tools": true,
185
+ "Evaluation of carbon impact accounting for regional energy sources": true,
186
+ "Evaluation of hardware lifecycle environmental impact": false
187
+ }
188
+ },
189
+ "4.3 Energy Cost and Environmental Impact of Deployment": {
190
+ "status": "Yes",
191
+ "sources": [
192
+ {
193
+ "type": "🌐",
194
+ "detail": "https://huggingface.co/HuggingFaceTB/SmolVLM-Instruct",
195
+ "name": "Model Card"
196
+ }
197
+ ],
198
+ "questions": {
199
+ "Evaluation of inference FLOPS": false,
200
+ "Evaluation of inference energy consumption on most common deployment setting": true,
201
+ "Evaluation of inference energy consumption on multiple deployment settings": true,
202
+ "Evaluation of task-specific energy consumption variations": false,
203
+ "Evaluation of carbon impact for deployment infrastructure": false,
204
+ "Evaluation of hardware lifecycle environmental impact for deployment": false
205
+ }
206
+ },
207
+ "4.4 Environmental Costs Transparency and Documentation": {
208
+ "status": "Yes",
209
+ "sources": [
210
+ {
211
+ "type": "🌐",
212
+ "detail": "https://huggingface.co/HuggingFaceTB/SmolVLM-Instruct",
213
+ "name": "Model Card"
214
+ }
215
+ ],
216
+ "questions": {
217
+ "Documentation about equipment and infrastructure specifications": true,
218
+ "Sufficient documentation of evaluation methods": false,
219
+ "Sufficient documentation of evaluation methods to replicate findings": true,
220
+ "Sufficient documentation of evaluation results for comparison": true
221
+ }
222
+ }
223
+ },
224
+ "5. Privacy and Data Protection Evaluation": {
225
+ "5.1 Privacy and Data Protection Overview": {
226
+ "status": "Yes",
227
+ "sources": [
228
+ {
229
+ "type": "🌐",
230
+ "detail": "https://huggingface.co/HuggingFaceTB/SmolVLM-Instruct",
231
+ "name": "Model Card"
232
+ }
233
+ ],
234
+ "questions": {
235
+ "Evaluations at various stages": true,
236
+ "Have intrinsic properties been evaluated for privacy vulnerabilities": false,
237
+ "Have extrinsic privacy evaluations been run": true,
238
+ "Have evaluations been run across all applicable modalities": true,
239
+ "Have privacy evaluations been run that take the form of automatic quantitative evaluation": true,
240
+ "Have privacy evaluations been run with human participants?": false
241
+ }
242
+ },
243
+ "5.2 Privacy, Likeness, and Publicity Harms": {
244
+ "status": "No",
245
+ "sources": [],
246
+ "questions": {
247
+ "Has the AI system been evaluated for its likelihood of revealing personal information": false,
248
+ "Has the AI system been evaluated for its likelihood of facilitating impersonation": false,
249
+ "Has the AI system been evaluated for its likelihood of providing confabulated personal information": false
250
+ }
251
+ },
252
+ "5.3 Intellectual Property and Information Security": {
253
+ "status": "No",
254
+ "sources": [],
255
+ "questions": {
256
+ "Has the AI system been evaluated for its likelihood of reproducing sensitive or copyrighted information": false,
257
+ "Has the system been evaluated for other information security risks": false
258
+ }
259
+ },
260
+ "5.4 Privacy Evaluation Transparency and Documentation": {
261
+ "status": "No",
262
+ "sources": [],
263
+ "questions": {
264
+ "Sufficient documentation of evaluation methods": false,
265
+ "Sufficient documentation of evaluation results": false,
266
+ "Documentation of evaluation limitations": false,
267
+ "Documentation of deployment considerations": false,
268
+ "Documentation of training data risk categories": false
269
+ }
270
+ }
271
+ },
272
+ "6. Financial Costs Evaluation": {
273
+ "6.1 Financial Costs Overview": {
274
+ "status": "No",
275
+ "sources": [],
276
+ "questions": {
277
+ "Evaluation of costs at various stages": false,
278
+ "Have costs been evaluated for different system components": false,
279
+ "Have cost evaluations been run across all applicable modalities": false,
280
+ "Have cost evaluations included both direct and indirect expenses": false,
281
+ "Have cost projections been validated against actual expenses": false
282
+ }
283
+ },
284
+ "6.2 Development and Training Costs": {
285
+ "status": "Yes",
286
+ "sources": [
287
+ {
288
+ "type": "🌐",
289
+ "detail": "https://huggingface.co/HuggingFaceTB/SmolVLM-Instruct",
290
+ "name": "Model Card"
291
+ }
292
+ ],
293
+ "questions": {
294
+ "Assessment of research and development labor costs": false,
295
+ "Evaluation of data collection and preprocessing costs": false,
296
+ "Assessment of training infrastructure costs": false,
297
+ "Assessment of costs associated with different training approaches": false,
298
+ "Evaluation of model architecture and size impact on costs": true
299
+ }
300
+ },
301
+ "6.3 Deployment and Operation Costs": {
302
+ "status": "Yes",
303
+ "sources": [
304
+ {
305
+ "type": "🌐",
306
+ "detail": "https://huggingface.co/HuggingFaceTB/SmolVLM-Instruct",
307
+ "name": "Model Card"
308
+ }
309
+ ],
310
+ "questions": {
311
+ "Assessment of inference and serving costs": true,
312
+ "Evaluation of storage and hosting expenses": false,
313
+ "Assessment of scaling costs": false,
314
+ "Evaluation of costs specific to different deployment contexts": false,
315
+ "Assessment of update and fine-tuning costs": false
316
+ }
317
+ },
318
+ "6.4 Financial Cost Documentation and Transparency": {
319
+ "status": "No",
320
+ "sources": [],
321
+ "questions": {
322
+ "Documentation of cost evaluation methodology": false,
323
+ "Documentation of cost breakdowns and metrics": false,
324
+ "Documentation of cost variations": false,
325
+ "Documentation of cost projections": false
326
+ }
327
+ }
328
+ },
329
+ "7. Data and Content Moderation Labor Evaluation": {
330
+ "7.1 Labor Evaluation Overview": {
331
+ "status": "No",
332
+ "sources": [],
333
+ "questions": {
334
+ "Evaluation of labor practices at various stages": false,
335
+ "Have labor conditions been evaluated for different worker categories": false,
336
+ "Have labor evaluations been run across all applicable task types": false,
337
+ "Have labor practices been evaluated against industry standards": false,
338
+ "Have labor evaluations included both direct and contracted workers": false,
339
+ "Have evaluations considered different regional contexts": false
340
+ }
341
+ },
342
+ "7.2 Working Conditions and Compensation": {
343
+ "status": "No",
344
+ "sources": [],
345
+ "questions": {
346
+ "Assessment of compensation relative to standards": false,
347
+ "Assessment of job security and classification": false,
348
+ "Evaluation of workplace safety and protections": false,
349
+ "Assessment of worker autonomy": false,
350
+ "Evaluation of power dynamics": false
351
+ }
352
+ },
353
+ "7.3 Worker Wellbeing and Support": {
354
+ "status": "No",
355
+ "sources": [],
356
+ "questions": {
357
+ "Assessment of psychological support systems": false,
358
+ "Evaluation of content preparation and exposure limits": false,
359
+ "Evaluation of cultural and linguistic support": false
360
+ }
361
+ },
362
+ "7.4 Labor Practice Documentation and Transparency": {
363
+ "status": "No",
364
+ "sources": [],
365
+ "questions": {
366
+ "Documentation of evaluation methodology": false,
367
+ "Documentation of worker demographics": false,
368
+ "Documentation of support systems": false,
369
+ "Documentation of incident reporting procedures": false
370
+ }
371
+ }
372
+ }
373
+ }
374
+ }