From 2979aaf4aa6f79922dab2a6366f800c874302354 Mon Sep 17 00:00:00 2001
From: Sebastian Nagel
Date: Thu, 17 Oct 2019 11:58:36 +0200
Subject: [PATCH] [BasicNormalizer] Trailing question mark in url query test should be added, fixes #247

---
 CHANGES.txt | 1 +
 src/test/resources/normalizer/weirdToNormalizedUrls.csv | 5 ++++-
 2 files changed, 5 insertions(+), 1 deletion(-)

diff --git a/CHANGES.txt b/CHANGES.txt
index 7562a69..d28e267 100644
--- a/CHANGES.txt
+++ b/CHANGES.txt
@@ -1,6 +1,7 @@
 Crawler-Commons Change Log
 
 Current Development 1.1-SNAPSHOT (yyyy-mm-dd)
+- [BasicNormalizer] Trailing question mark in url query test should be added (Chaiavi, sebastian-nagel) #247
 - EffectiveTldFinder to validate returned domain names for length restrictions (sebastian-nagel, Chaiavi) #251
 - Upgrade unit tests to use JUnit v5.x and parameterized tests (Chaiavi) #249, #253, #255
 - [Robots] Robots parser to always handle absolute sitemap URL even without valid base URL (pr3mar, kkrugler, sebastian-nagel) #240
diff --git a/src/test/resources/normalizer/weirdToNormalizedUrls.csv b/src/test/resources/normalizer/weirdToNormalizedUrls.csv
index 4afb2a1..3b20d8f 100644
--- a/src/test/resources/normalizer/weirdToNormalizedUrls.csv
+++ b/src/test/resources/normalizer/weirdToNormalizedUrls.csv
@@ -126,4 +126,7 @@ file:///foo/bar.txt, file:///foo/bar.txt
 ftp:/, ftp:/
 http:, http:/
 http:////, http:/
-http:///////, http:/
\ No newline at end of file
+http:///////, http:/
+
+# empty path with trailing question mark (empty query) #247
+http://example.com?,http://example.com/?