victormiller
committed on
Commit
•
f43eed3
1
Parent(s):
b6c8b4f
Update curated.py
Browse files - curated.py +1 -1
curated.py
CHANGED
@@ -599,7 +599,7 @@ filtering_process = Div(
|
|
599 |
Section(
|
600 |
H3("FreeLaw"),
|
601 |
H4("Download and Extraction"),
|
602 |
-
P("The dataset was downloaded from:" A("https://storage.courtlistener.com/bulk-data/", href="https://storage.courtlistener.com/bulk-data/"), )#". There are 19 CSV files which contain overlapping content. CSV files can contain content in multiple columns requiring a holistic extraction approach. Text was extracted from the following using html2text function. The block below shows how each text type was extracted."),
|
603 |
D_code("""
|
604 |
("html", html2text),
|
605 |
("html_lawbox", html2text),
|
|
|
599 |
Section(
|
600 |
H3("FreeLaw"),
|
601 |
H4("Download and Extraction"),
|
602 |
+
#P("The dataset was downloaded from:" A("https://storage.courtlistener.com/bulk-data/", href="https://storage.courtlistener.com/bulk-data/"), )#". There are 19 CSV files which contain overlapping content. CSV files can contain content in multiple columns requiring a holistic extraction approach. Text was extracted from the following using html2text function. The block below shows how each text type was extracted."),
|
603 |
D_code("""
|
604 |
("html", html2text),
|
605 |
("html_lawbox", html2text),
|