katielink committed on
Commit
7048a68
1 Parent(s): c1de2e4

Update questions.json

Browse files
Files changed (1) hide show
  1. questions.json +48 -0
questions.json CHANGED
@@ -33,6 +33,54 @@
33
  "offensive_data": "Does the dataset contain data that, if viewed directly, might be offensive, insulting, threatening, or might otherwise cause anxiety? If so, please describe why.",
34
  "de_identification": "If the dataset has been de-identified, were any measures taken to avoid the re-identification of individuals? Examples of such measures: removing patients with rare pathologies or shifting time stamps.",
35
  "sensitive_data": "Does the dataset contain data that might be considered sensitive in any way (e.g., data that reveals racial or ethnic origins, sexual orientations, religious beliefs, political opinions or union memberships, or locations; financial or health data; biometric or genetic data; forms of government identification, such as social security numbers; criminal history)? If so, please provide a description."
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
36
  }
37
  }
38
 
 
33
  "offensive_data": "Does the dataset contain data that, if viewed directly, might be offensive, insulting, threatening, or might otherwise cause anxiety? If so, please describe why.",
34
  "de_identification": "If the dataset has been de-identified, were any measures taken to avoid the re-identification of individuals? Examples of such measures: removing patients with rare pathologies or shifting time stamps.",
35
  "sensitive_data": "Does the dataset contain data that might be considered sensitive in any way (e.g., data that reveals racial or ethnic origins, sexual orientations, religious beliefs, political opinions or union memberships, or locations; financial or health data; biometric or genetic data; forms of government identification, such as social security numbers; criminal history)? If so, please provide a description."
36
+ },
37
+ "Devices and Contextual Attributes in Data Collection": {
38
+ "device_details": "For data that requires a device for collection or where the context of the experiment affects the outcome, provide relevant information based on the device or context used.",
39
+ "MRI_machine_used": "If an MRI machine was used, what is the machine and model?",
40
+ "heart_rate_device": "If heart rate was measured, what device was used for measuring heart rate variation?",
41
+ "cortisol_measurement_details": "If cortisol measurement is reported at multiple sites, provide details.",
42
+ "smartphones_used": "If smartphones were used to collect data, provide the model names.",
43
+ "additional_info": "Provide any other relevant information or details not covered in the above questions."
44
+ },
45
+ "Challenge in Tests and Confounding Factors": {
46
+ "limitation_factors": "Which factors in the data might limit the generalization of potentially derived models?",
47
+ "auxiliary_labels_info": "Is information about the factors that might limit model generalization available as auxiliary labels for challenge tests?",
48
+ "device_diversity": "Describe the number and diversity of devices included in the dataset.",
49
+ "recording_specificities": "Provide details on data recording specificities, e.g., views for chest x-ray images.",
50
+ "recording_sites_info": "Provide information on the number and diversity of recording sites included in the dataset.",
51
+ "distribution_shifts": "Describe any distribution shifts over time in the data.",
52
+ "confounding_factors": "What confounding factors might be present in the data?"
53
+ },
54
+ "Collection and Use of Demographic Information": {
55
+ "demographic_sub_populations": "Does the dataset identify any demographic sub-populations (e.g., by age, gender, ethnicity)?",
56
+ "demographic_categories_assessment": "If yes, describe the reasons these categories were assessed and how this information was acquired.",
57
+ "patient_consent_info": "If patients’ demographic data is included, did they consent to the collection and use of this information?",
58
+ "demographic_outcome_associations": "Are there any known associations between demographics and the outcomes in this dataset?",
59
+ "demographic_update_mechanism": "Is there a mechanism for updating demographic information after its initial collection?",
60
+ "demographic_subgroup_distribution": "Provide a description of the distribution of each subgroup population within the dataset.",
61
+ "regulation_info": "If no demographic data is collected, is there any regulation that prevents such collection?"
62
+ },
63
+ "Pre-processing / De-identification": {
64
+ "de_identification_processing": "Was there any pre-processing done for de-identification of the patients?",
65
+ "data_cleaning_processing": "Was there any pre-processing done for cleaning the data?",
66
+ "raw_data_availability": "Is 'raw' data (post de-identification) saved and available?",
67
+ "exclusion_criteria": "Were any instances excluded from the dataset at the time of preprocessing? If so, why?"
68
+ },
69
+ "Labeling and Subjectivity of Labeling": {
70
+ "explicit_labels": "Is there an explicit label or target associated with each data instance?",
71
+ "label_details": "If yes, describe the labels provided, who performed the labeling, and the labeling strategy used.",
72
+ "label_definition": "If proxy labels are used, provide the label definition.",
73
+ "gold_standard_labels": "What proportion of the data has gold standard labels?",
74
+ "labeller_demographics": "Provide information on the demographics of the labellers and the guidelines they followed.",
75
+ "label_annotation_time": "On average, how much time was required to annotate each instance?",
76
+ "labeller_compensation": "Were the labellers compensated for their time? If so, how?"
77
+ },
78
+ "Collection Process": {
79
+ "REB_IRB_approval": "Were any REB/IRB approvals received for data collection?",
80
+ "data_acquisition_details": "How was the data associated with each instance acquired?",
81
+ "data_collection_mechanisms": "What mechanisms or procedures were used to collect the data?",
82
+ "data_collection_participants": "Who was involved in the data collection process, and how were they compensated?",
83
+ "data_collection_timeframe": "Over what timeframe was the data collected?"
84
  }
85
  }
86