Update web.py
Browse files
web.py
CHANGED
|
@@ -449,7 +449,7 @@ def web_data():
|
|
| 449 |
|
| 450 |
Details(
|
| 451 |
Summary("Sample documents that are classified as English but with score less than 0.65"),
|
| 452 |
-
DV("data/sample_en_low.json",3),
|
| 453 |
),
|
| 454 |
|
| 455 |
H4("1.3 URL Filtering"),
|
|
@@ -485,7 +485,7 @@ def web_data():
|
|
| 485 |
|
| 486 |
Details(
|
| 487 |
Summary("Sample documents whose urls are in our curated url domain list"),
|
| 488 |
-
DV("data/sample_url_exclusion.json", 0
|
| 489 |
),
|
| 490 |
H3("2. Line-Level Removal"),
|
| 491 |
P("""
|
|
|
|
| 449 |
|
| 450 |
Details(
|
| 451 |
Summary("Sample documents that are classified as English but with score less than 0.65"),
|
| 452 |
+
DV("data/sample_en_low.json", 3),
|
| 453 |
),
|
| 454 |
|
| 455 |
H4("1.3 URL Filtering"),
|
|
|
|
| 485 |
|
| 486 |
Details(
|
| 487 |
Summary("Sample documents whose urls are in our curated url domain list"),
|
| 488 |
+
DV("data/sample_url_exclusion.json", 0),
|
| 489 |
),
|
| 490 |
H3("2. Line-Level Removal"),
|
| 491 |
P("""
|