TeStereo report
APIUtilityVerifier InternalCallVerifier BooleanVerifier IgnoredMethod HybridVerifier
/**
 * Parses the {@code testXHTML_utf8.html} test resource to plain text through the
 * {@link Tika} facade and verifies that each expected fragment, including the
 * non-ASCII characters, is present in the extracted content.
 *
 * <p>The test is disabled with {@code @Ignore}; the stated reason is that the
 * resource file is not available.
 *
 * @throws IOException   if the document stream cannot be read
 * @throws SAXException  declared for the parsing call
 * @throws TikaException if the document cannot be parsed
 */
@Test
@Ignore("The file 'testXHTML_utf8.html' is not available fo testing")
public void XtestParseUTF8() throws IOException, SAXException, TikaException {
    String resourcePath = "/test-documents/testXHTML_utf8.html";
    Metadata extractedMetadata = new Metadata();
    Tika facade = new Tika();
    String extractedText = facade.parseToString(
            HtmlParserTest.class.getResourceAsStream(resourcePath), extractedMetadata);

    // Checked in this order; the first missing fragment fails the test.
    String[] expectedFragments = {
        "Title : Tilte with UTF-8 chars öäå",
        "Content with UTF-8 chars",
        "åäö"
    };
    for (String fragment : expectedFragments) {
        assertTrue("Did not contain expected text:" + fragment, extractedText.contains(fragment));
    }
}