From 8532d1dc4c04a4a47648c00d60140b9e65c7fdae Mon Sep 17 00:00:00 2001 From: "U-BASIS\\dsmyda" Date: Mon, 20 Jul 2020 11:43:16 -0400 Subject: [PATCH] Added link to TIKA story about IBM500 issue --- .../sleuthkit/autopsy/coreutils/textutils/EncodingUtils.java | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/Core/src/org/sleuthkit/autopsy/coreutils/textutils/EncodingUtils.java b/Core/src/org/sleuthkit/autopsy/coreutils/textutils/EncodingUtils.java index 95e9ab20a6..e4fc7019c9 100755 --- a/Core/src/org/sleuthkit/autopsy/coreutils/textutils/EncodingUtils.java +++ b/Core/src/org/sleuthkit/autopsy/coreutils/textutils/EncodingUtils.java @@ -89,7 +89,7 @@ public class EncodingUtils { detector.setText(stream); CharsetMatch[] tikaResults = detector.detectAll(); - // Get all guesses by Tika. These CharsetMatch's are ordered + // Get all guesses by Tika. These matches are ordered // by descending confidence (largest first). if (tikaResults.length > 0) { CharsetMatch topPick = tikaResults[0]; @@ -98,7 +98,8 @@ public class EncodingUtils { // Legacy encoding, let's discard this one in favor // of the second pick. Tika has some problems with // mistakenly identifying text as IBM500. See JIRA-6600 - // for more details. + // and https://issues.apache.org/jira/browse/TIKA-2771 for + // more details. topPick = tikaResults[1]; }