|
1 |
| |
|
2 |
| |
|
3 |
| |
|
4 |
| |
|
5 |
| |
|
6 |
| |
|
7 |
| |
|
8 |
| |
|
9 |
| |
|
10 |
| |
|
11 |
| |
|
12 |
| |
|
13 |
| |
|
14 |
| |
|
15 |
| |
|
16 |
| |
|
17 |
| |
|
18 |
| package javax.mail.internet; |
|
19 |
| |
|
20 |
| |
|
21 |
| |
|
22 |
| |
|
23 |
| public class HeaderTokenizer { |
|
24 |
| public static class Token { |
|
25 |
| |
|
26 |
| public static final int ATOM = -1; |
|
27 |
| public static final int COMMENT = -3; |
|
28 |
| public static final int EOF = -4; |
|
29 |
| public static final int QUOTEDSTRING = -2; |
|
30 |
| private int _type; |
|
31 |
| private String _value; |
|
32 |
| |
|
33 |
682
| public Token(int type, String value) {
|
|
34 |
682
| _type = type;
|
|
35 |
682
| _value = value;
|
|
36 |
| } |
|
37 |
| |
|
38 |
923
| public int getType() {
|
|
39 |
923
| return _type;
|
|
40 |
| } |
|
41 |
| |
|
42 |
443
| public String getValue() {
|
|
43 |
443
| return _value;
|
|
44 |
| } |
|
45 |
| } |
|
46 |
| |
|
47 |
| private static final Token EOF = new Token(Token.EOF, null); |
|
48 |
| |
|
49 |
| public static final String MIME = "()<>@,;:\\\"\t []/?="; |
|
50 |
| |
|
51 |
| public static final String RFC822 = "()<>@,;:\\\"\t .[]"; |
|
52 |
| private static final String WHITE = " \t\n\r"; |
|
53 |
| private String _delimiters; |
|
54 |
| private String _header; |
|
55 |
| private boolean _skip; |
|
56 |
| private int pos; |
|
57 |
| |
|
58 |
11
| public HeaderTokenizer(String header) {
|
|
59 |
11
| this(header, RFC822);
|
|
60 |
| } |
|
61 |
| |
|
62 |
325
| public HeaderTokenizer(String header, String delimiters) {
|
|
63 |
325
| this(header, delimiters, true);
|
|
64 |
| } |
|
65 |
| |
|
66 |
341
| public HeaderTokenizer(String header,
|
|
67 |
| String delimiters, |
|
68 |
| boolean skipComments) { |
|
69 |
341
| _skip = skipComments;
|
|
70 |
341
| _header = header;
|
|
71 |
341
| _delimiters = delimiters;
|
|
72 |
| } |
|
73 |
| |
|
74 |
147
| public String getRemainder() {
|
|
75 |
147
| return _header.substring(pos);
|
|
76 |
| } |
|
77 |
| |
|
78 |
838
| public Token next() throws ParseException {
|
|
79 |
838
| return readToken();
|
|
80 |
| } |
|
81 |
| |
|
82 |
7
| public Token peek() throws ParseException {
|
|
83 |
7
| int start = pos;
|
|
84 |
7
| try {
|
|
85 |
7
| return readToken();
|
|
86 |
| } finally { |
|
87 |
7
| pos = start;
|
|
88 |
| } |
|
89 |
| } |
|
90 |
| |
|
91 |
| |
|
92 |
| |
|
93 |
| |
|
94 |
| |
|
95 |
| |
|
96 |
397
| private Token readAtomicToken() {
|
|
97 |
| |
|
98 |
397
| int start = pos;
|
|
99 |
397
| while (++pos < _header.length()) {
|
|
100 |
| |
|
101 |
1947
| char ch = _header.charAt(pos);
|
|
102 |
1947
| if (_delimiters.indexOf(_header.charAt(pos)) != -1 || ch < 32 || ch >= 127) {
|
|
103 |
237
| break;
|
|
104 |
| } |
|
105 |
| } |
|
106 |
| |
|
107 |
397
| return new Token(Token.ATOM, _header.substring(start, pos));
|
|
108 |
| } |
|
109 |
| |
|
110 |
| |
|
111 |
| |
|
112 |
| |
|
113 |
| |
|
114 |
| |
|
115 |
| |
|
116 |
| |
|
117 |
892
| private Token readToken() throws ParseException {
|
|
118 |
892
| if (pos >= _header.length()) {
|
|
119 |
158
| return EOF;
|
|
120 |
| } else { |
|
121 |
734
| char c = _header.charAt(pos);
|
|
122 |
| |
|
123 |
734
| if (c == '(') {
|
|
124 |
15
| Token comment = readComment();
|
|
125 |
11
| if (_skip) {
|
|
126 |
2
| return readToken();
|
|
127 |
| } else { |
|
128 |
9
| return comment;
|
|
129 |
| } |
|
130 |
| |
|
131 |
719
| } else if (c == '\"') {
|
|
132 |
30
| return readQuotedString();
|
|
133 |
| |
|
134 |
689
| } else if (WHITE.indexOf(c) != -1) {
|
|
135 |
45
| eatWhiteSpace();
|
|
136 |
45
| return readToken();
|
|
137 |
| |
|
138 |
644
| } else if (c < 32 || c >= 127 || _delimiters.indexOf(c) != -1) {
|
|
139 |
247
| pos++;
|
|
140 |
247
| return new Token((int)c, String.valueOf(c));
|
|
141 |
| } else { |
|
142 |
| |
|
143 |
397
| return readAtomicToken();
|
|
144 |
| } |
|
145 |
| } |
|
146 |
| } |
|
147 |
| |
|
148 |
| |
|
149 |
| |
|
150 |
| |
|
151 |
| |
|
152 |
| |
|
153 |
| |
|
154 |
| |
|
155 |
| |
|
156 |
| |
|
157 |
| |
|
158 |
5
| private String getEscapedValue(int start, int end) throws ParseException {
|
|
159 |
5
| StringBuffer value = new StringBuffer();
|
|
160 |
| |
|
161 |
5
| for (int i = start; i < end; i++) {
|
|
162 |
15
| char ch = _header.charAt(i);
|
|
163 |
| |
|
164 |
15
| if (ch == '\\') {
|
|
165 |
3
| i++;
|
|
166 |
3
| if (i == end) {
|
|
167 |
0
| throw new ParseException("Invalid escape character");
|
|
168 |
| } |
|
169 |
3
| value.append(_header.charAt(i));
|
|
170 |
| } |
|
171 |
| |
|
172 |
| |
|
173 |
12
| else if (ch == '\r') {
|
|
174 |
| |
|
175 |
2
| if (i < end - 1 && _header.charAt(i + 1) == '\n') {
|
|
176 |
2
| i++;
|
|
177 |
| } |
|
178 |
| } |
|
179 |
| else { |
|
180 |
| |
|
181 |
10
| value.append(ch);
|
|
182 |
| } |
|
183 |
| } |
|
184 |
5
| return value.toString();
|
|
185 |
| } |
|
186 |
| |
|
187 |
| |
|
188 |
| |
|
189 |
| |
|
190 |
| |
|
191 |
| |
|
192 |
| |
|
193 |
| |
|
194 |
15
| private Token readComment() throws ParseException {
|
|
195 |
15
| int start = pos + 1;
|
|
196 |
15
| int nesting = 1;
|
|
197 |
| |
|
198 |
15
| boolean requiresEscaping = false;
|
|
199 |
| |
|
200 |
| |
|
201 |
15
| while (++pos < _header.length()) {
|
|
202 |
142
| char ch = _header.charAt(pos);
|
|
203 |
142
| if (ch == ')') {
|
|
204 |
18
| nesting--;
|
|
205 |
18
| if (nesting == 0) {
|
|
206 |
11
| break;
|
|
207 |
| } |
|
208 |
| } |
|
209 |
124
| else if (ch == '(') {
|
|
210 |
7
| nesting++;
|
|
211 |
| } |
|
212 |
117
| else if (ch == '\\') {
|
|
213 |
1
| pos++;
|
|
214 |
1
| requiresEscaping = true;
|
|
215 |
| } |
|
216 |
| |
|
217 |
116
| else if (ch == '\r') {
|
|
218 |
1
| requiresEscaping = true;
|
|
219 |
| } |
|
220 |
| } |
|
221 |
| |
|
222 |
15
| if (nesting != 0) {
|
|
223 |
4
| throw new ParseException("Unbalanced comments");
|
|
224 |
| } |
|
225 |
| |
|
226 |
11
| String value;
|
|
227 |
11
| if (requiresEscaping) {
|
|
228 |
2
| value = getEscapedValue(start, pos);
|
|
229 |
| } |
|
230 |
| else { |
|
231 |
9
| value = _header.substring(start, pos++);
|
|
232 |
| } |
|
233 |
11
| return new Token(Token.COMMENT, value);
|
|
234 |
| } |
|
235 |
| |
|
236 |
| |
|
237 |
| |
|
238 |
| |
|
239 |
| |
|
240 |
| |
|
241 |
| |
|
242 |
| |
|
243 |
30
| private Token readQuotedString() throws ParseException {
|
|
244 |
30
| int start = pos+1;
|
|
245 |
30
| boolean requiresEscaping = false;
|
|
246 |
| |
|
247 |
| |
|
248 |
30
| while (++pos < _header.length()) {
|
|
249 |
434
| char ch = _header.charAt(pos);
|
|
250 |
434
| if (ch == '"') {
|
|
251 |
26
| String value;
|
|
252 |
26
| if (requiresEscaping) {
|
|
253 |
3
| value = getEscapedValue(start, pos);
|
|
254 |
| } |
|
255 |
| else { |
|
256 |
23
| value = _header.substring(start, pos++);
|
|
257 |
| } |
|
258 |
26
| return new Token(Token.QUOTEDSTRING, value);
|
|
259 |
| } |
|
260 |
408
| else if (ch == '\\') {
|
|
261 |
4
| pos++;
|
|
262 |
4
| requiresEscaping = true;
|
|
263 |
| } |
|
264 |
| |
|
265 |
404
| else if (ch == '\r') {
|
|
266 |
1
| requiresEscaping = true;
|
|
267 |
| } |
|
268 |
| } |
|
269 |
| |
|
270 |
4
| throw new ParseException("Missing '\"'");
|
|
271 |
| } |
|
272 |
| |
|
273 |
| |
|
274 |
| |
|
275 |
| |
|
276 |
45
| private void eatWhiteSpace() {
|
|
277 |
| |
|
278 |
45
| while (++pos < _header.length()
|
|
279 |
| && WHITE.indexOf(_header.charAt(pos)) != -1) |
|
280 |
| ; |
|
281 |
| } |
|
282 |
| } |