From c5a88d6d8b22e12c2bb6fb1c8a4409d7eba66b2b Mon Sep 17 00:00:00 2001 From: "Michael[tm] Smith" Date: Sun, 13 Sep 2020 04:14:19 +0900 Subject: [PATCH] Correct non-UTF8 handling in HtmlInputStreamReader This change corrects the code to set the right encoding in the case when the external encoding has been determined to be non-UTF8. --- src/nu/validator/htmlparser/io/HtmlInputStreamReader.java | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/src/nu/validator/htmlparser/io/HtmlInputStreamReader.java b/src/nu/validator/htmlparser/io/HtmlInputStreamReader.java index 45e0278f..c54e591a 100755 --- a/src/nu/validator/htmlparser/io/HtmlInputStreamReader.java +++ b/src/nu/validator/htmlparser/io/HtmlInputStreamReader.java @@ -169,7 +169,8 @@ public HtmlInputStreamReader(InputStream inputStream, } else { err(Encoding.msgLegacyEncoding(encoding.getCanonName())); if (driver != null) { - driver.setEncoding(Encoding.UTF16, Confidence.CERTAIN); + // XXX Why did we do driver.setEncoding(Encoding.UTF16... ? + driver.setEncoding(encoding, Confidence.CERTAIN); } } }