victormiller
committed on
Commit
•
83ec67b
1
Parent(s):
b961e8c
Update curated.py
Browse files - curated.py +1 -2
curated.py
CHANGED
@@ -725,8 +725,7 @@ filtering_process = Div(
|
|
725 |
Div(
|
726 |
H3("HackerNews"),
|
727 |
P("High-quality dialog-based dataset where user comments on the links as the head post aggregated by Y Combinator."),
|
728 |
-
|
729 |
-
P("The dataset was downloaded from the HackerNews repo here:", A("https://hacker-news.firebaseio.com/v0/item/", href="https://hacker-news.firebaseio.com/v0/item/"), ". The dataset was parsed using the Story ID. In this dataset each post is a story, and each reply is considered subsequent story. Story IDs were considered between ID 1 to 37500000. The URL for all Story IDs was pinged. If that ID returned an error, the ID was removed. Each request was given a 2 second wait to account for network time."),
|
730 |
P("The HackerNews dataset contains a vast amount of stories and is known for lively discussions. Due to the number of replies a story may contain, only longest threads included stories from the 3rd level onwards. All stories included the title (1st level) and all direct replies (2nd level). Replies to the replies (3rd level) are only included for X STORIES."),
|
731 |
H4("Filtering"),
|
732 |
Ol(
|
|
|
725 |
Div(
|
726 |
H3("HackerNews"),
|
727 |
P("High-quality dialog-based dataset where user comments on the links as the head post aggregated by Y Combinator."),
|
728 |
+
P(B("Download and Extraction: "), "The dataset was downloaded from the HackerNews repo here:", A("https://hacker-news.firebaseio.com/v0/item/", href="https://hacker-news.firebaseio.com/v0/item/"), ". The dataset was parsed using the Story ID. In this dataset each post is a story, and each reply is considered subsequent story. Story IDs were considered between ID 1 to 37500000. The URL for all Story IDs was pinged. If that ID returned an error, the ID was removed. Each request was given a 2 second wait to account for network time."),
|
|
|
729 |
P("The HackerNews dataset contains a vast amount of stories and is known for lively discussions. Due to the number of replies a story may contain, only longest threads included stories from the 3rd level onwards. All stories included the title (1st level) and all direct replies (2nd level). Replies to the replies (3rd level) are only included for X STORIES."),
|
730 |
H4("Filtering"),
|
731 |
Ol(
|