Spaces:
Running
Running
victormiller
committed on
Commit
•
752d87b
1
Parent(s):
95edc44
Update common.py
Browse files
common.py
CHANGED
@@ -43,7 +43,9 @@ r"[A-Za-z0-9!#$%&'*+/=?^_`{|}~-]+(?:\.[A-Za-z0-9!#$%&'*+/=?^_`{|}~-]+)*@(?:(?:[A
|
|
43 |
[0-5]|2[0-4][0-9]|[" r"01]?[0-9][0-9]?)\.){3}(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?
|
44 |
|[A-Za-z0-9-]*[A-Za-z0-9]:)])
|
45 |
"""
|
46 |
-
|
|
|
|
|
47 |
global_div = Div(
|
48 |
Section(
|
49 |
H2("Global Steps"),
|
@@ -103,7 +105,7 @@ global_div = Div(
|
|
103 |
H3("Removing PII"),
|
104 |
P("We have removed two types of PII from the dataset: email address and IP address. Regular expressions are used to identify and replace these PII with a generic placeholder. Below is an example of how we removed email addresses from the dataset:"),
|
105 |
P("We have used the following regular expressions to identify and replace PII:"),
|
106 |
-
Ul(Li("Email:"), Li(email_code, style="list-style-type: none"), Li("IP Address: NEED TO UPDATE")),
|
107 |
),
|
108 |
Section(
|
109 |
H2("Normalization Form C (NFC)"),
|
|
|
43 |
[0-5]|2[0-4][0-9]|[" r"01]?[0-9][0-9]?)\.){3}(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?
|
44 |
|[A-Za-z0-9-]*[A-Za-z0-9]:)])
|
45 |
"""
|
46 |
+
ip_address_code = """
|
47 |
+
r"(?:(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)\.){3}(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)"
|
48 |
+
"""
|
49 |
global_div = Div(
|
50 |
Section(
|
51 |
H2("Global Steps"),
|
|
|
105 |
H3("Removing PII"),
|
106 |
P("We have removed two types of PII from the dataset: email address and IP address. Regular expressions are used to identify and replace these PII with a generic placeholder. Below is an example of how we removed email addresses from the dataset:"),
|
107 |
P("We have used the following regular expressions to identify and replace PII:"),
|
108 |
+
Ul(Li("Email:"), Li(email_code, style="list-style-type: none"), Li("IP Address: NEED TO UPDATE"), Li(ip_address_code, style="list-style-type: none")),
|
109 |
),
|
110 |
Section(
|
111 |
H2("Normalization Form C (NFC)"),
|