shivarama23
committed on
Commit
•
e1e1053
1
Parent(s):
1fe393b
Llama v2 finetuned for redaction of PIIs
Browse files
- README.md +9 -0
- adapter_config.json +21 -0
- adapter_model.bin +3 -0
- added_tokens.json +3 -0
- dataset.json +112 -0
- special_tokens_map.json +24 -0
- tokenizer.json +0 -0
README.md
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
tags:
|
3 |
+
- autotrain
|
4 |
+
- text-generation
|
5 |
+
widget:
|
6 |
+
- text: "I love AutoTrain because "
|
7 |
+
---
|
8 |
+
|
9 |
+
# Model Trained Using AutoTrain
|
adapter_config.json
ADDED
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "abhishek/llama-2-7b-hf-small-shards",
|
4 |
+
"bias": "none",
|
5 |
+
"fan_in_fan_out": false,
|
6 |
+
"inference_mode": true,
|
7 |
+
"init_lora_weights": true,
|
8 |
+
"layers_pattern": null,
|
9 |
+
"layers_to_transform": null,
|
10 |
+
"lora_alpha": 32,
|
11 |
+
"lora_dropout": 0.05,
|
12 |
+
"modules_to_save": null,
|
13 |
+
"peft_type": "LORA",
|
14 |
+
"r": 16,
|
15 |
+
"revision": null,
|
16 |
+
"target_modules": [
|
17 |
+
"q_proj",
|
18 |
+
"v_proj"
|
19 |
+
],
|
20 |
+
"task_type": "CAUSAL_LM"
|
21 |
+
}
|
adapter_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07c719f923d3e3878123962fed4f017d052c18a2b2d7203336b974fadfa2b786
|
3 |
+
size 33600461
|
added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<pad>": 32000
|
3 |
+
}
|
dataset.json
ADDED
@@ -0,0 +1,112 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"instruction": "redact patient_name, age, disease from the text",
|
4 |
+
"input": "John Doe is a patient who is 45 years old and has been diagnosed with COVID-19. He is currently under observation and receiving appropriate medical care. The doctors are closely monitoring his condition and providing necessary treatment.",
|
5 |
+
"output": "<redacted> is a patient who is <redacted> years old and has been diagnosed with <redacted>. He is currently under observation and receiving appropriate medical care. The doctors are closely monitoring his condition and providing necessary treatment."
|
6 |
+
},
|
7 |
+
{
|
8 |
+
"instruction": "redact patient_name, age, disease from the text",
|
9 |
+
"input": "Jane Smith, aged 32, is currently receiving treatment for Diabetes. She has been prescribed medications and advised to follow a specific diet and lifestyle changes to manage her condition effectively. Regular check-ups are scheduled to monitor her progress.",
|
10 |
+
"output": "<redacted>, aged <redacted>, is currently receiving treatment for <redacted>. She has been prescribed medications and advised to follow a specific diet and lifestyle changes to manage her condition effectively. Regular check-ups are scheduled to monitor her progress."
|
11 |
+
},
|
12 |
+
{
|
13 |
+
"instruction": "redact patient_name, age, disease from the text",
|
14 |
+
"input": "Mary Johnson's Patient Information indicates she is 55 years old and suffering from Hypertension. She has been advised to take her prescribed medications regularly and make lifestyle modifications to control her blood pressure levels. Regular follow-ups with her healthcare provider are scheduled.",
|
15 |
+
"output": "<redacted>'s Patient Information indicates she is <redacted> years old and suffering from <redacted>. She has been advised to take her prescribed medications regularly and make lifestyle modifications to control her blood pressure levels. Regular follow-ups with her healthcare provider are scheduled."
|
16 |
+
},
|
17 |
+
{
|
18 |
+
"instruction": "redact patient_name, age, disease from the text",
|
19 |
+
"input": "Mr. Smith is a 60-year-old man with a diagnosis of Heart Disease. He is under the care of a cardiologist and following a treatment plan to manage his condition. Lifestyle changes, including a heart-healthy diet and exercise, are recommended for his overall well-being.",
|
20 |
+
"output": "<redacted> is a <redacted>-year-old man with a diagnosis of <redacted>. He is under the care of a cardiologist and following a treatment plan to manage his condition. Lifestyle changes, including a heart-healthy diet and exercise, are recommended for his overall well-being."
|
21 |
+
},
|
22 |
+
{
|
23 |
+
"instruction": "redact patient_name, age, disease from the text",
|
24 |
+
"input": "Sarah Miller, aged 40, has been diagnosed with Cancer. She is undergoing chemotherapy and radiation treatments as part of her cancer treatment plan. Support from family and friends has been essential during her journey to recovery.",
|
25 |
+
"output": "<redacted>, aged <redacted>, has been diagnosed with <redacted>. She is undergoing chemotherapy and radiation treatments as part of her cancer treatment plan. Support from family and friends has been essential during her journey to recovery."
|
26 |
+
},
|
27 |
+
{
|
28 |
+
"instruction": "redact patient_name, age, disease from the text",
|
29 |
+
"input": "James Johnson is 28 years old and currently undergoing treatment for COVID-19. He is in isolation to prevent further spread of the virus. The healthcare team is closely monitoring his symptoms and providing supportive care.",
|
30 |
+
"output": "<redacted> is <redacted> years old and currently undergoing treatment for <redacted>. He is in isolation to prevent further spread of the virus. The healthcare team is closely monitoring his symptoms and providing supportive care."
|
31 |
+
},
|
32 |
+
{
|
33 |
+
"instruction": "redact patient_name, age, disease from the text",
|
34 |
+
"input": "Emma Smith, aged 38, has been diagnosed with Asthma. She carries an inhaler with her at all times for quick relief during asthma attacks. Emma is advised to avoid triggers that worsen her symptoms.",
|
35 |
+
"output": "<redacted>, aged <redacted>, has been diagnosed with <redacted>. She carries an inhaler with her at all times for quick relief during asthma attacks. <redacted> is advised to avoid triggers that worsen her symptoms."
|
36 |
+
},
|
37 |
+
{
|
38 |
+
"instruction": "redact patient_name, age, disease from the text",
|
39 |
+
"input": "Laura Johnson's Diagnosis indicates she is 50 years old and suffering from Diabetes. She is managing her blood sugar levels through medication and lifestyle changes, including a balanced diet and regular exercise.",
|
40 |
+
"output": "<redacted>'s Diagnosis indicates she is <redacted> years old and suffering from <redacted>. She is managing her blood sugar levels through medication and lifestyle changes, including a balanced diet and regular exercise."
|
41 |
+
},
|
42 |
+
{
|
43 |
+
"instruction": "redact patient_name, age, disease from the text",
|
44 |
+
"input": "Lorem ipsum dolor sit amet, consectetur adipiscing elit. Patient Name: John Doe, Age: 45, Disease: COVID-19. Nulla venenatis accumsan id a enim. Integer quis dui sit amet est pellentesque consectetur. Etiam lobortis, quam et lacinia condimentum, urna quam varius velit, ut ultricies neque quam vitae odio.",
|
45 |
+
"output": "Lorem ipsum dolor sit amet, consectetur adipiscing elit. Patient Name: <redacted>, Age: <redacted>, Disease: <redacted>. Nulla venenatis accumsan id a enim. Integer quis dui sit amet est pellentesque consectetur. Etiam lobortis, quam et lacinia condimentum, urna quam varius velit, ut ultricies neque quam vitae odio."
|
46 |
+
},
|
47 |
+
{
|
48 |
+
"instruction": "redact patient_name, age, disease from the text",
|
49 |
+
"input": "Nullam tristique purus ac sapien egestas. Patient: Jane Smith, Age: 32, Diagnosis: Diabetes. Phasellus venenatis nisi eget ligula varius luctus. Aenean ac metus dui. Sed sit amet volutpat elit. Mauris eleifend, nulla vel rhoncus tempus, odio arcu tempus libero, ut scelerisque arcu lectus at mi.",
|
50 |
+
"output": "Nullam tristique purus ac sapien egestas. Patient: <redacted>, Age: <redacted>, Diagnosis: <redacted>. Phasellus venenatis nisi eget ligula varius luctus. Aenean ac metus dui. Sed sit amet volutpat elit. Mauris eleifend, nulla vel rhoncus tempus, odio arcu tempus libero, ut scelerisque arcu lectus at mi."
|
51 |
+
},
|
52 |
+
{
|
53 |
+
"instruction": "redact patient_name, age, disease from the text",
|
54 |
+
"input": "Proin sagittis sapien vitae lorem dictum. Patient Information: Mary Johnson, Age: 55, Disease: Hypertension. Fusce sit amet quam nec odio posuere vestibulum vel in erat. Vivamus eleifend nunc purus, a fringilla ligula venenatis ac. In semper quam quis quam varius, quis rutrum lacus interdum.",
|
55 |
+
"output": "Proin sagittis sapien vitae lorem dictum. Patient Information: <redacted>, Age: <redacted>, Disease: <redacted>. Fusce sit amet quam nec odio posuere vestibulum vel in erat. Vivamus eleifend nunc purus, a fringilla ligula venenatis ac. In semper quam quis quam varius, quis rutrum lacus interdum."
|
56 |
+
},
|
57 |
+
{
|
58 |
+
"instruction": "redact patient_name, age, disease from the text",
|
59 |
+
"input": "Lorem ipsum dolor sit amet, consectetur adipiscing elit. Patient Name: Alice Johnson, Age: 27, Disease: COVID-19. Nulla venenatis accumsan id a enim. Integer quis dui sit amet est pellentesque consectetur. Etiam lobortis, quam et lacinia condimentum, urna quam varius velit, ut ultricies neque quam vitae odio.",
|
60 |
+
"output": "Lorem ipsum dolor sit amet, consectetur adipiscing elit. Patient Name: <redacted>, Age: <redacted>, Disease: <redacted>. Nulla venenatis accumsan id a enim. Integer quis dui sit amet est pellentesque consectetur. Etiam lobortis, quam et lacinia condimentum, urna quam varius velit, ut ultricies neque quam vitae odio."
|
61 |
+
},
|
62 |
+
{
|
63 |
+
"instruction": "redact patient_name, age, disease from the text",
|
64 |
+
"input": "Nullam tristique purus ac sapien egestas. Patient: James Smith, Age: 50, Diagnosis: Asthma. Phasellus venenatis nisi eget ligula varius luctus. Aenean ac metus dui. Sed sit amet volutpat elit. Mauris eleifend, nulla vel rhoncus tempus, odio arcu tempus libero, ut scelerisque arcu lectus at mi.",
|
65 |
+
"output": "Nullam tristique purus ac sapien egestas. Patient: <redacted>, Age: <redacted>, Diagnosis: <redacted>. Phasellus venenatis nisi eget ligula varius luctus. Aenean ac metus dui. Sed sit amet volutpat elit. Mauris eleifend, nulla vel rhoncus tempus, odio arcu tempus libero, ut scelerisque arcu lectus at mi."
|
66 |
+
},
|
67 |
+
{
|
68 |
+
"instruction": "redact patient_name, age, disease from the text",
|
69 |
+
"input": "Proin sagittis sapien vitae lorem dictum. Patient Information: Mary Johnson, Age: 55, Disease: Hypertension. Fusce sit amet quam nec odio posuere vestibulum vel in erat. Vivamus eleifend nunc purus, a fringilla ligula venenatis ac. In semper quam quis quam varius, quis rutrum lacus interdum.",
|
70 |
+
"output": "Proin sagittis sapien vitae lorem dictum. Patient Information: <redacted>, Age: <redacted>, Disease: <redacted>. Fusce sit amet quam nec odio posuere vestibulum vel in erat. Vivamus eleifend nunc purus, a fringilla ligula venenatis ac. In semper quam quis quam varius, quis rutrum lacus interdum."
|
71 |
+
},
|
72 |
+
{
|
73 |
+
"instruction": "redact patient_name, age, disease from the text",
|
74 |
+
"input": "Lorem ipsum dolor sit amet, consectetur adipiscing elit. Patient Name: John Doe, Age: 45, Disease: COVID-19. Nulla venenatis accumsan id a enim. Integer quis dui sit amet est pellentesque consectetur. Etiam lobortis, quam et lacinia condimentum, urna quam varius velit, ut ultricies neque quam vitae odio.",
|
75 |
+
"output": "Lorem ipsum dolor sit amet, consectetur adipiscing elit. Patient Name: <redacted>, Age: <redacted>, Disease: <redacted>. Nulla venenatis accumsan id a enim. Integer quis dui sit amet est pellentesque consectetur. Etiam lobortis, quam et lacinia condimentum, urna quam varius velit, ut ultricies neque quam vitae odio."
|
76 |
+
},
|
77 |
+
{
|
78 |
+
"instruction": "redact patient_name, age, disease from the text",
|
79 |
+
"input": "Nullam tristique purus ac sapien egestas. Patient: Jane Smith, Age: 32, Diagnosis: Diabetes. Phasellus venenatis nisi eget ligula varius luctus. Aenean ac metus dui. Sed sit amet volutpat elit. Mauris eleifend, nulla vel rhoncus tempus, odio arcu tempus libero, ut scelerisque arcu lectus at mi.",
|
80 |
+
"output": "Nullam tristique purus ac sapien egestas. Patient: <redacted>, Age: <redacted>, Diagnosis: <redacted>. Phasellus venenatis nisi eget ligula varius luctus. Aenean ac metus dui. Sed sit amet volutpat elit. Mauris eleifend, nulla vel rhoncus tempus, odio arcu tempus libero, ut scelerisque arcu lectus at mi."
|
81 |
+
},
|
82 |
+
{
|
83 |
+
"instruction": "redact patient_name, age, disease from the text",
|
84 |
+
"input": "Proin sagittis sapien vitae lorem dictum. Patient Information: Mary Johnson, Age: 55, Disease: Hypertension. Fusce sit amet quam nec odio posuere vestibulum vel in erat. Vivamus eleifend nunc purus, a fringilla ligula venenatis ac. In semper quam quis quam varius, quis rutrum lacus interdum.",
|
85 |
+
"output": "Proin sagittis sapien vitae lorem dictum. Patient Information: <redacted>, Age: <redacted>, Disease: <redacted>. Fusce sit amet quam nec odio posuere vestibulum vel in erat. Vivamus eleifend nunc purus, a fringilla ligula venenatis ac. In semper quam quis quam varius, quis rutrum lacus interdum."
|
86 |
+
},
|
87 |
+
{
|
88 |
+
"instruction": "redact patient_name, age, disease from the text",
|
89 |
+
"input": "Lorem ipsum dolor sit amet, consectetur adipiscing elit. Patient Name: Alice Johnson, Age: 27, Disease: COVID-19. Nulla venenatis accumsan id a enim. Integer quis dui sit amet est pellentesque consectetur. Etiam lobortis, quam et lacinia condimentum, urna quam varius velit, ut ultricies neque quam vitae odio.",
|
90 |
+
"output": "Lorem ipsum dolor sit amet, consectetur adipiscing elit. Patient Name: <redacted>, Age: <redacted>, Disease: <redacted>. Nulla venenatis accumsan id a enim. Integer quis dui sit amet est pellentesque consectetur. Etiam lobortis, quam et lacinia condimentum, urna quam varius velit, ut ultricies neque quam vitae odio."
|
91 |
+
},
|
92 |
+
{
|
93 |
+
"instruction": "redact patient_name, age, disease from the text",
|
94 |
+
"input": "Nullam tristique purus ac sapien egestas. Patient: James Smith, Age: 50, Diagnosis: Asthma. Phasellus venenatis nisi eget ligula varius luctus. Aenean ac metus dui. Sed sit amet volutpat elit. Mauris eleifend, nulla vel rhoncus tempus, odio arcu tempus libero, ut scelerisque arcu lectus at mi.",
|
95 |
+
"output": "Nullam tristique purus ac sapien egestas. Patient: <redacted>, Age: <redacted>, Diagnosis: <redacted>. Phasellus venenatis nisi eget ligula varius luctus. Aenean ac metus dui. Sed sit amet volutpat elit. Mauris eleifend, nulla vel rhoncus tempus, odio arcu tempus libero, ut scelerisque arcu lectus at mi."
|
96 |
+
},
|
97 |
+
{
|
98 |
+
"instruction": "redact patient_name, age, disease from the text",
|
99 |
+
"input": "Proin sagittis sapien vitae lorem dictum. Patient Information: Mary Johnson, Age: 55, Disease: Hypertension. Fusce sit amet quam nec odio posuere vestibulum vel in erat. Vivamus eleifend nunc purus, a fringilla ligula venenatis ac. In semper quam quis quam varius, quis rutrum lacus interdum.",
|
100 |
+
"output": "Proin sagittis sapien vitae lorem dictum. Patient Information: <redacted>, Age: <redacted>, Disease: <redacted>. Fusce sit amet quam nec odio posuere vestibulum vel in erat. Vivamus eleifend nunc purus, a fringilla ligula venenatis ac. In semper quam quis quam varius, quis rutrum lacus interdum."
|
101 |
+
},
|
102 |
+
{
|
103 |
+
"instruction": "redact patient_name, age, disease from the text",
|
104 |
+
"input": "Lorem ipsum dolor sit amet, consectetur adipiscing elit. Patient Name: John Doe, Age: 45, Disease: COVID-19. Nulla venenatis accumsan id a enim. Integer quis dui sit amet est pellentesque consectetur. Etiam lobortis, quam et lacinia condimentum, urna quam varius velit, ut ultricies neque quam vitae odio.",
|
105 |
+
"output": "Lorem ipsum dolor sit amet, consectetur adipiscing elit. Patient Name: <redacted>, Age: <redacted>, Disease: <redacted>. Nulla venenatis accumsan id a enim. Integer quis dui sit amet est pellentesque consectetur. Etiam lobortis, quam et lacinia condimentum, urna quam varius velit, ut ultricies neque quam vitae odio."
|
106 |
+
},
|
107 |
+
{
|
108 |
+
"instruction": "redact patient_name, age, disease from the text",
|
109 |
+
"input": "Nullam tristique purus ac sapien egestas. Patient: Jane Smith, Age: 32, Diagnosis: Diabetes. Phasellus venenatis nisi eget ligula varius luctus. Aenean ac metus dui. Sed sit amet volutpat elit. Mauris eleifend, nulla vel rhoncus tempus, odio arcu tempus libero, ut scelerisque arcu lectus at mi.",
|
110 |
+
"output": "Nullam tristique purus ac sapien egestas. Patient: <redacted>, Age: <redacted>, Diagnosis: <redacted>. Phasellus venenatis nisi eget ligula varius luctus. Aenean ac metus dui. Sed sit amet volutpat elit. Mauris eleifend, nulla vel rhoncus tempus, odio arcu tempus libero, ut scelerisque arcu lectus at mi."
|
111 |
+
}
|
112 |
+
]
|
special_tokens_map.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": true,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"eos_token": {
|
10 |
+
"content": "</s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": true,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"pad_token": "<unk>",
|
17 |
+
"unk_token": {
|
18 |
+
"content": "<unk>",
|
19 |
+
"lstrip": false,
|
20 |
+
"normalized": true,
|
21 |
+
"rstrip": false,
|
22 |
+
"single_word": false
|
23 |
+
}
|
24 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|