1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17 package org.apache.tika.parser.microsoft;
18
19 import java.io.InputStream;
20
21 import org.apache.tika.metadata.Metadata;
22 import org.apache.tika.sax.BodyContentHandler;
23 import org.xml.sax.ContentHandler;
24
25 import junit.framework.TestCase;
26
27 public class PowerPointParserTest extends TestCase {
28
29 public void testPowerPointParser() throws Exception {
30 InputStream input = PowerPointParserTest.class.getResourceAsStream(
31 "/test-documents/testPPT.ppt");
32 try {
33 Metadata metadata = new Metadata();
34 ContentHandler handler = new BodyContentHandler();
35 new OfficeParser().parse(input, handler, metadata);
36
37 assertEquals(
38 "application/vnd.ms-powerpoint",
39 metadata.get(Metadata.CONTENT_TYPE));
40 assertEquals("Sample Powerpoint Slide", metadata.get(Metadata.TITLE));
41 assertEquals("Keith Bennett", metadata.get(Metadata.AUTHOR));
42 String content = handler.toString();
43 assertTrue(content.contains("Sample Powerpoint Slide"));
44 assertTrue(content.contains("Powerpoint X for Mac"));
45 } finally {
46 input.close();
47 }
48 }
49
50 }