--- src/java/au/id/jericho/lib/html/StreamEncodingDetector.java.orig 2008-06-17 21:01:53.890292905 +0200 +++ src/java/au/id/jericho/lib/html/StreamEncodingDetector.java 2008-06-17 21:02:43.940300330 +0200 @@ -203,9 +203,9 @@ // Assume the more likely case of four 8-bit characters <= U+00FF. // Check whether it fits some common EBCDIC strings that might be found at the start of a document: if (b1==0x4C) { // first character is EBCDIC '<' (ASCII 'L'), check a couple more characters before assuming EBCDIC encoding: - if (b2==0x6F && b3==0xA7 && b4==0x94) return setEncoding(EBCDIC,"default EBCDIC encoding ( detected)"); // first four bytes are " detected)"); // first four bytes are " detected)"); // first four bytes are " detected)"); // first four bytes are "