From 23c156ab2c8b1d1cfd46b74df4e575f49bea92ea Mon Sep 17 00:00:00 2001 From: Jan Lukas Gernert Date: Sun, 12 Mar 2023 13:39:17 +0100 Subject: [PATCH] add new test --- .../tests/readability/dev418/expected.html | 52 +++++++++ .../tests/readability/dev418/source.html | 104 ++++++++++++++++++ src/full_text_parser/readability/tests.rs | 5 + 3 files changed, 161 insertions(+) create mode 100644 resources/tests/readability/dev418/expected.html create mode 100644 resources/tests/readability/dev418/source.html diff --git a/resources/tests/readability/dev418/expected.html b/resources/tests/readability/dev418/expected.html new file mode 100644 index 0000000..98e12f8 --- /dev/null +++ b/resources/tests/readability/dev418/expected.html @@ -0,0 +1,52 @@ +
+

+ Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. +

+
+

+ Single <img> +

+

An image

+

+ Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. +

+
+

+ Single <figure> +

+
An image
+ Caption of the figure +

+ Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. +

+
+

+ <ul> List of <img> +

+
    +
  • An image
  • +
  • An image
  • +
  • An image
  • +
+

+ Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. +

+
+

+ <ul> List of <figure> +

+
    +
  • An image
    + Caption of the figure +
  • +
  • An image
    + Caption of the figure +
  • +
  • An image
    + Caption of the figure +
  • +
+

+ Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. +

+
diff --git a/resources/tests/readability/dev418/source.html b/resources/tests/readability/dev418/source.html new file mode 100644 index 0000000..9857248 --- /dev/null +++ b/resources/tests/readability/dev418/source.html @@ -0,0 +1,104 @@ + + + + + + Readability Test + + + + +

+ Readability Test +

+

+ Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. +

+
+

+ Single <img> +

+

+ An image +

+

+ Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. +

+
+

+ Single <figure> +

+
+ An image +
+ Caption of the figure +
+
+

+ Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. +

+
+

+ <ul> List of <img> +

+ +

+ Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. +

+
+

+ <ul> List of <figure> +

+ +

+ Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. +

+ + diff --git a/src/full_text_parser/readability/tests.rs b/src/full_text_parser/readability/tests.rs index 192a834..0f30591 100644 --- a/src/full_text_parser/readability/tests.rs +++ b/src/full_text_parser/readability/tests.rs @@ -161,6 +161,11 @@ async fn data_url_image() { run_test("data-url-image").await } +#[tokio::test] +async fn dev418() { + run_test("dev418").await +} + #[tokio::test] async fn webmd_1() { run_test("webmd-1").await