1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17 package org.apache.tika.parser.opendocument;
18
19 import java.io.InputStream;
20
21 import junit.framework.TestCase;
22
23 import org.apache.tika.metadata.Metadata;
24 import org.apache.tika.sax.BodyContentHandler;
25 import org.xml.sax.ContentHandler;
26
27 import org.apache.tika.parser.odf.OpenDocumentParser;
28
29 public class ODFParserTest extends TestCase {
30
31 public void testXMLParser() throws Exception {
32 InputStream input = ODFParserTest.class.getResourceAsStream(
33 "/test-documents/testODFwithOOo3.odt");
34 try {
35 Metadata metadata = new Metadata();
36 ContentHandler handler = new BodyContentHandler();
37 new OpenDocumentParser().parse(input, handler, metadata);
38
39 assertEquals(
40 "application/vnd.oasis.opendocument.text",
41 metadata.get(Metadata.CONTENT_TYPE));
42
43 String content = handler.toString();
44 assertTrue(content.contains("Tika is part of the Lucene project."));
45 assertTrue(content.contains("Solr"));
46 assertTrue(content.contains("one embedded"));
47 assertTrue(content.contains("Rectangle Title"));
48 assertTrue(content.contains("a blue background and dark border")); } finally {
49 input.close();
50 }
51 }
52
53 }