1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17 package org.apache.tika.parser.html;
18
19
20
21
22
23
24 public class DefaultHtmlMapper implements HtmlMapper {
25
26 public String mapSafeElement(String name) {
27
28
29 if ("H1".equals(name)) return "h1";
30 if ("H2".equals(name)) return "h2";
31 if ("H3".equals(name)) return "h3";
32 if ("H4".equals(name)) return "h4";
33 if ("H5".equals(name)) return "h5";
34 if ("H6".equals(name)) return "h6";
35
36 if ("P".equals(name)) return "p";
37 if ("PRE".equals(name)) return "pre";
38 if ("BLOCKQUOTE".equals(name)) return "blockquote";
39
40 if ("UL".equals(name)) return "ul";
41 if ("OL".equals(name)) return "ol";
42 if ("MENU".equals(name)) return "ul";
43 if ("LI".equals(name)) return "li";
44 if ("DL".equals(name)) return "dl";
45 if ("DT".equals(name)) return "dt";
46 if ("DD".equals(name)) return "dd";
47
48 if ("TABLE".equals(name)) return "table";
49 if ("THEAD".equals(name)) return "thead";
50 if ("TBODY".equals(name)) return "tbody";
51 if ("TR".equals(name)) return "tr";
52 if ("TH".equals(name)) return "th";
53 if ("TD".equals(name)) return "td";
54
55 if ("ADDRESS".equals(name)) return "address";
56
57 return null;
58 }
59
60 public boolean isDiscardElement(String name) {
61 return "STYLE".equals(name) || "SCRIPT".equals(name);
62 }
63
64 }