summaryrefslogtreecommitdiffstats
path: root/parsers/SymbolMap.java
blob: 752fcf6ef04a5689151117e641f164161a959069 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
/*+
 *   Copyright 2012 rsiddharth
 *   Email: <rsiddharth@ninthfloor.org> 
 * 
 *   This file is part of Scruf.
 *
 *   Scruf is free software: you can redistribute it and/or modify
 *   it under the terms of the GNU General Public License as published by
 *   the Free Software Foundation, either version 3 of the License, or
 *   (at your option) any later version.
 *
 *   This program is distributed in the hope that it will be useful,
 *   but WITHOUT ANY WARRANTY; without even the implied warranty of
 *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *   GNU General Public License for more details.
 *
 *   You should have received a copy of the GNU General Public License
 *   along with this program.  If not, see <http://www.gnu.org/licenses/>.
 */



package scruf.parsers;

import java.util.regex.*;
import java.util.*;

/**
 * Map of Symbols & their HTML equivalent numbers.
 */
public class SymbolMap extends HashMap<String, String> {
	public SymbolMap() {
		put("!","&#33;");
		put("\"","&#34;");
		put("#","&#35;");
		put("$","&#36;");
		put("%","&#37;");
		put("&","&#38;");
		put("'","&#39;");
		put("(","&#40;");
		put(")","&#41;");
		put("*","&#42;");
		put("+","&#43;");
		put(",","&#44;");
		put("-","&#45;");
		put(".","&#46;");
		put("/","&#47;");
		put(":","&#58;");
		put(";","&#59;");
		put("<","&#60;");
		put("=","&#61;");
		put(">","&#62;");
		put("?","&#63;");
		put("@","&#64;");
		put("[","&#91;");
		put("\\","&#92;");
		put("]","&#93;");
		put("^","&#94;");
		put("_","&#95;");
		put("`","&#96;");
		put("{","&#123;");
		put("|","&#124;");
		put("}","&#125;");
		put("~","&#126;");
	}
	/**
     * this method quotes symbols to a HTML number.
     */
    public String quote(String string) {
	Pattern pattern = Pattern.compile("(\\&(amp|lt|gt|(\\#35))\\;)|(\\p{Punct})");
	Matcher matcher = pattern.matcher(string);
	StringBuffer sbuffer = new StringBuffer();
	while(matcher.find()) {
		if(matcher.group(4)!=null) {
			matcher.appendReplacement(sbuffer,
									  this.get(matcher.group()));
		}
	}
	matcher.appendTail(sbuffer);
	return sbuffer.toString();
    }
}