change ? to ^

This commit is contained in:
momo 2015-10-08 13:01:17 -04:00
parent f7cb43f363
commit e0547aaebf

View File

@ -69,7 +69,7 @@ class AbstractFileChunk {
// Given a byte array, filter out all occurances non-characters
// http://unicode.org/cldr/utility/list-unicodeset.jsp?a=[:Noncharacter_Code_Point=True:]
// and non-printable control characters except tabulator, new line and carriage return
// and replace them with the question mark character (?)
// and replace them with the character (^)
private static byte[] sanitize(byte[] input) {
Charset charset = Charset.forName("UTF-8"); // NON-NLS
String inputString = new String(input, charset);
@ -80,7 +80,7 @@ class AbstractFileChunk {
if (charIsValidSolrUTF8(ch)) {
sanitized.append(ch);
} else {
sanitized.append("?"); // NON-NLS
sanitized.append('^'); // NON-NLS
}
}