victormiller
committed on
Commit
•
5236603
1
Parent(s):
44f2e3d
Update common.py
Browse files
common.py
CHANGED
@@ -47,6 +47,10 @@ ip_address_code = """
|
|
47 |
r"(?:(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)\.){3}(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)"
|
48 |
"""
|
49 |
|
|
|
|
|
|
|
|
|
50 |
pii_table = pd.DataFrame(
|
51 |
{
|
52 |
"OPII Type": [
|
@@ -136,7 +140,8 @@ global_div = Div(
|
|
136 |
),
|
137 |
Section(
|
138 |
H3("NFC Implementation"),
|
139 |
-
P("We have used the ftfy library to normalize the text to NFC. The library provides a simple API for normalizing text to NFC, which can be applied to the entire dataset one row at a time. Below is the code snippet about how we normalized text to NFC:
|
|
|
140 |
),
|
141 |
Section(
|
142 |
H3("NFC Examples"),
|
|
|
47 |
r"(?:(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)\.){3}(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)"
|
48 |
"""
|
49 |
|
50 |
+
nfc_code = """
|
51 |
+
ftfy.fix_text(text, normalization="NFC")
|
52 |
+
"""
|
53 |
+
|
54 |
pii_table = pd.DataFrame(
|
55 |
{
|
56 |
"OPII Type": [
|
|
|
140 |
),
|
141 |
Section(
|
142 |
H3("NFC Implementation"),
|
143 |
+
P("We have used the ftfy library to normalize the text to NFC. The library provides a simple API for normalizing text to NFC, which can be applied to the entire dataset one row at a time. Below is the code snippet about how we normalized text to NFC:"),
|
144 |
+
Ul(Li(nfc_code, style="list-style-type: none")),
|
145 |
),
|
146 |
Section(
|
147 |
H3("NFC Examples"),
|