1 | |
|
2 | |
|
3 | |
|
4 | |
|
5 | |
|
6 | |
|
7 | |
|
8 | |
|
9 | |
|
10 | |
|
11 | |
|
12 | |
|
13 | |
|
14 | |
|
15 | |
package org.apache.tapestry.util.text; |
16 | |
|
17 | |
|
18 | |
|
19 | |
|
20 | |
|
21 | |
|
22 | |
|
23 | |
|
24 | |
|
25 | |
public class MarkupCharacterTranslator implements ICharacterTranslator { |
26 | |
|
27 | |
private static final String SAFE_CHARACTERS = "01234567890" |
28 | |
+ "abcdefghijklmnopqrstuvwxyz" + "ABCDEFGHIJKLMNOPQRSTUVWXYZ" |
29 | |
+ "\t\n\r !#$%'()*+,-./:;=?@[\\]^_`{|}~"; |
30 | |
|
31 | 0 | private static final String[][] ENTITIES = { |
32 | |
{"\"", """}, |
33 | |
{"<", "<"}, {">", ">"}, {"&", "&"} |
34 | |
}; |
35 | |
|
36 | 0 | private static final ICharacterMatcher SAFE_MATCHER = new AsciiCharacterMatcher(SAFE_CHARACTERS); |
37 | 0 | private static final ICharacterTranslator ENTITY_TRANSLATOR = new AsciiCharacterTranslator(ENTITIES); |
38 | |
|
39 | |
private boolean _encodeNonAscii; |
40 | |
private ICharacterMatcher _safeMatcher; |
41 | |
private ICharacterTranslator _entityTranslator; |
42 | |
|
43 | |
public MarkupCharacterTranslator() |
44 | |
{ |
45 | 0 | this(true); |
46 | 0 | } |
47 | |
|
48 | |
public MarkupCharacterTranslator(boolean encodeNonAscii) |
49 | |
{ |
50 | 0 | this(encodeNonAscii, SAFE_MATCHER, ENTITY_TRANSLATOR); |
51 | 0 | } |
52 | |
|
53 | |
public MarkupCharacterTranslator(boolean encodeNonAscii, |
54 | |
ICharacterMatcher safeMatcher, ICharacterTranslator entityTranslator) |
55 | 0 | { |
56 | 0 | _encodeNonAscii = encodeNonAscii; |
57 | 0 | _safeMatcher = safeMatcher; |
58 | 0 | _entityTranslator = entityTranslator; |
59 | 0 | } |
60 | |
|
61 | |
public MarkupCharacterTranslator(boolean encodeNonAscii, |
62 | |
String safeCharacters, String[][] entities) |
63 | 0 | { |
64 | 0 | _encodeNonAscii = encodeNonAscii; |
65 | 0 | _safeMatcher = new AsciiCharacterMatcher(safeCharacters); |
66 | 0 | _entityTranslator = new AsciiCharacterTranslator(entities); |
67 | 0 | } |
68 | |
|
69 | |
|
70 | |
|
71 | |
|
72 | |
public String translate(char ch) |
73 | |
{ |
74 | |
|
75 | |
|
76 | 0 | if (ch >= 160 && !_encodeNonAscii) |
77 | 0 | return null; |
78 | |
|
79 | 0 | if (_safeMatcher.matches(ch)) |
80 | 0 | return null; |
81 | |
|
82 | 0 | String entity = _entityTranslator.translate(ch); |
83 | 0 | if (entity != null) |
84 | 0 | return entity; |
85 | |
|
86 | |
|
87 | |
|
88 | 0 | return "&#" + (int) ch + ";"; |
89 | |
} |
90 | |
} |