File tree Expand file tree Collapse file tree 3 files changed +5
-4
lines changed
main/resources/META-INF/services
java/org/apache/tika/config
resources/org/apache/tika/config Expand file tree Collapse file tree 3 files changed +5
-4
lines changed Original file line number Diff line number Diff line change 1313# See the License for the specific language governing permissions and
1414# limitations under the License.
1515
16- org.apache.tika.parser.html.HtmlEncodingDetector
16+ org.apache.tika.parser.html.charsetdetector.StandardHtmlEncodingDetector
1717org.apache.tika.parser.txt.UniversalEncodingDetector
1818org.apache.tika.parser.txt.Icu4jEncodingDetector
Original file line number Diff line number Diff line change 3939import org .apache .tika .parser .Parser ;
4040import org .apache .tika .parser .ParserDecorator ;
4141import org .apache .tika .parser .html .HtmlEncodingDetector ;
42+ import org .apache .tika .parser .html .charsetdetector .StandardHtmlEncodingDetector ;
4243import org .apache .tika .parser .txt .Icu4jEncodingDetector ;
4344import org .apache .tika .parser .txt .TXTParser ;
4445import org .apache .tika .parser .txt .UniversalEncodingDetector ;
@@ -52,7 +53,7 @@ public void testDefault() {
5253 assertTrue (detector instanceof CompositeEncodingDetector );
5354 List <EncodingDetector > detectors = ((CompositeEncodingDetector ) detector ).getDetectors ();
5455 assertEquals (3 , detectors .size ());
55- assertTrue (detectors .get (0 ) instanceof HtmlEncodingDetector );
56+ assertTrue (detectors .get (0 ) instanceof StandardHtmlEncodingDetector );
5657 assertTrue (detectors .get (1 ) instanceof UniversalEncodingDetector );
5758 assertTrue (detectors .get (2 ) instanceof Icu4jEncodingDetector );
5859 }
Original file line number Diff line number Diff line change 1919 <!-- Explicitly request default parsers -->
2020 <parsers />
2121 <encodingDetectors >
22- <!-- All detectors except HtmlEncodingDetector -->
22+ <!-- All detectors except StandardHtmlEncodingDetector -->
2323 <encodingDetector class="org.apache.tika.detect.DefaultEncodingDetector">
24- <encodingDetector-exclude class="org.apache.tika.parser.html.HtmlEncodingDetector"/>
24+ <encodingDetector-exclude class="org.apache.tika.parser.html.charsetdetector.StandardHtmlEncodingDetector"/>
2525 </encodingDetector >
2626 <!-- One other detector, to check ordering -->
2727 <encodingDetector class="org.apache.tika.detect.NonDetectingEncodingDetector"/>
You can’t perform that action at this time.
0 commit comments