diff --git a/tika-parsers/src/main/java/org/apache/tika/parser/html/HtmlEncodingDetector.java b/tika-parsers/src/main/java/org/apache/tika/parser/html/HtmlEncodingDetector.java
index 559ec4d..73f394a 100644
--- a/tika-parsers/src/main/java/org/apache/tika/parser/html/HtmlEncodingDetector.java
+++ b/tika-parsers/src/main/java/org/apache/tika/parser/html/HtmlEncodingDetector.java
@@ -112,6 +112,11 @@
             //that is valid
             while (charsetMatcher.find()) {
                 String candCharset = charsetMatcher.group(1);
+                // TIKA-2592 - HTML content that declares its encoding as "unicode" is treated as UTF-8.
+                // Without this special case, Charset.forName("unicode") would resolve to UTF-16 instead.
+                if ( "unicode".equalsIgnoreCase( candCharset ) ) {
+                    return Charset.forName( "UTF-8" );
+                }
                 if (CharsetUtils.isSupported(candCharset)) {
                     try {
                         return CharsetUtils.forName(candCharset);
