|
||||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |
java.lang.Object
TestCase
org.apache.tika.parser.html.HtmlParserTest
public class HtmlParserTest
Constructor Summary | |
---|---|
HtmlParserTest()
|
Method Summary | |
---|---|
void |
testBaseHref()
Test case for TIKA-287 |
void |
testCharactersDirectlyUnderBodyElement()
Test case for TIKA-210 |
void |
testDetectOfCharset()
Test case for TIKA-334 |
void |
testHttpEquivCharset()
Test case for TIKA-332 |
void |
testHttpEquivCharsetFunkyAttributes()
Test case for TIKA-349 |
void |
testIgnoreCharsetDetectorLanguage()
Test case for TIKA-339: Don't use language returned by CharsetDetector |
void |
testLineBreak()
Test case for HTML content like "<div>foo<br>bar</div>baz" that should result in three whitespace-separated tokens "foo", "bar" and "baz" instead of a single token "foobarbaz". |
void |
testMetaHttpEquivWithLotsOfPreambleText()
Test case for TIKA-357 |
void |
testParseAscii()
|
void |
testParseEmpty()
|
void |
testUsingCharsetInContentTypeHeader()
Test case for TIKA-341 |
void |
testUsingFunkyCharsetInContentTypeHeader()
Test case for TIKA-350 |
void |
testWhitespaceBetweenTableCells()
Test case for TIKA-268 |
void |
testXhtmlParsing()
|
void |
XtestParseUTF8()
|
Methods inherited from class java.lang.Object |
---|
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
Constructor Detail |
---|
public HtmlParserTest()
Method Detail |
---|
public void testParseAscii() throws java.lang.Exception
java.lang.Exception
public void XtestParseUTF8() throws java.io.IOException, org.xml.sax.SAXException, org.apache.tika.exception.TikaException
java.io.IOException
org.xml.sax.SAXException
org.apache.tika.exception.TikaException
public void testXhtmlParsing() throws java.lang.Exception
java.lang.Exception
public void testParseEmpty() throws java.lang.Exception
java.lang.Exception
public void testCharactersDirectlyUnderBodyElement() throws java.lang.Exception
java.lang.Exception
public void testBaseHref() throws java.lang.Exception
java.lang.Exception
public void testWhitespaceBetweenTableCells() throws java.lang.Exception
java.lang.Exception
public void testHttpEquivCharset() throws java.lang.Exception
java.lang.Exception
public void testDetectOfCharset() throws java.lang.Exception
java.lang.Exception
public void testUsingCharsetInContentTypeHeader() throws java.lang.Exception
java.lang.Exception
public void testLineBreak() throws java.lang.Exception
java.lang.Exception
public void testIgnoreCharsetDetectorLanguage() throws java.lang.Exception
java.lang.Exception
public void testHttpEquivCharsetFunkyAttributes() throws java.lang.Exception
java.lang.Exception
public void testUsingFunkyCharsetInContentTypeHeader() throws java.lang.Exception
java.lang.Exception
public void testMetaHttpEquivWithLotsOfPreambleText() throws java.lang.Exception
java.lang.Exception
|
||||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |