1 |
|
|
2 |
|
|
3 |
|
|
4 |
|
|
5 |
|
|
6 |
|
|
7 |
|
|
8 |
|
|
9 |
|
|
10 |
|
|
11 |
|
|
12 |
|
|
13 |
|
|
14 |
|
|
15 |
|
|
16 |
|
|
17 |
|
|
18 |
|
|
19 |
|
|
20 |
|
|
21 |
|
package jalview.util; |
22 |
|
|
23 |
|
import java.util.ArrayList; |
24 |
|
import java.util.List; |
25 |
|
import java.util.StringTokenizer; |
26 |
|
import java.util.regex.Pattern; |
27 |
|
|
28 |
|
|
29 |
|
|
30 |
|
|
31 |
|
@author |
32 |
|
|
33 |
|
|
|
|
| 87% |
Uncovered Elements: 9 (69) |
Complexity: 22 |
Complexity Density: 0.52 |
|
34 |
|
/**
 * Splits a description string, which may or may not be HTML, into its text
 * content and the hyperlinks it contains.
 * <p>
 * The text is treated as HTML only if it contains an {@code <html>} tag
 * (matched case-insensitively). Parsing is a simple tokenisation, not a real
 * HTML parser. Anchors are recognised only in the form
 * {@code <a href="url">label</a>}, with the quoted href as the sole attribute
 * and non-empty label text; other forms may produce a malformed link entry or
 * an exception.
 */
public class ParseHtmlBodyAndLinks
{
  private static final Pattern LEFT_ANGLE_BRACKET_PATTERN = Pattern
          .compile("<");

  /** Upper-cased start of the only anchor tag form that is recognised. */
  private static final String ANCHOR_PREFIX = "A HREF=";

  /** Marker left in the content in place of each extracted hyperlink. */
  private static final String LINK_PLACEHOLDER = "%LINK%";

  /** The description as supplied; null if it was null or empty. */
  String orig = null;

  /** False if the description was null, empty or had no {@code <html>} tag. */
  boolean htmlContent = true;

  /** Extracted links, each encoded as "label|url", in document order. */
  List<String> links = new ArrayList<String>();

  /** Parsed text; stays null if the description was null or empty. */
  String content;

  /**
   * Parses the given description and
   * <ul>
   * <li>collects each {@code <a href="...">} as a "label|url" string,
   * retrievable with {@link #getLinks()}</li>
   * <li>collects the remaining text, with tags dropped, {@code <br>} replaced
   * by {@code newline}, each anchor replaced by its label followed by
   * {@code %LINK%}, and the entities {@code &lt;}, {@code &gt;} and
   * {@code &amp;} decoded, retrievable with {@link #getContent()}</li>
   * </ul>
   * A null or empty description leaves the content and original text null and
   * the link list empty.
   * 
   * @param description
   *          html or plain text to parse; may be null
   * @param removeHTML
   *          only has an effect when the description is not HTML: if true the
   *          content is the whole description with entities decoded, rather
   *          than the tokenised text
   * @param newline
   *          text to insert wherever a {@code <br>} tag is found
   */
  public ParseHtmlBodyAndLinks(String description, boolean removeHTML,
          String newline)
  {
    if (description == null || description.length() == 0)
    {
      htmlContent = false;
      return;
    }
    orig = description;
    if (description.toUpperCase().indexOf("<HTML>") == -1)
    {
      htmlContent = false;
    }

    StringBuilder sb = new StringBuilder(description.length());
    StringTokenizer st = new StringTokenizer(description, "<");
    while (st.hasMoreTokens())
    {
      /*
       * Splitting on '>' makes each token "text<tag": the text that follows
       * the previous tag, then (optionally) the next tag without its closing
       * bracket.
       */
      String token = st.nextToken(">");
      String tag = null;
      int startTag = token.indexOf("<");
      if (startTag > -1)
      {
        tag = token.substring(startTag + 1);
        token = token.substring(0, startTag);
      }

      /*
       * Text in front of a tag is always content, whatever the tag is. It
       * must not be dropped for <br>, nor because it happens to start with
       * '/' or to read "html".
       */
      sb.append(token);

      if (tag == null)
      {
        continue;
      }
      if (tag.toUpperCase().startsWith(ANCHOR_PREFIX))
      {
        // the url runs from the first double quote to the tag's last character
        String link = tag.substring(tag.indexOf("\"") + 1,
                tag.length() - 1);
        // the label is the text up to the '<' of the closing </a>
        String label = st.nextToken("<>");
        links.add(label + "|" + link);
        sb.append(label).append(LINK_PLACEHOLDER);
      }
      else if (tag.equalsIgnoreCase("br"))
      {
        sb.append(newline);
      }
      // any other tag (including closing tags) contributes no text
    }

    if (removeHTML && !htmlContent)
    {
      /*
       * Not HTML: discard the tokenised text and start again from the raw
       * description with '<' escaped. translateEntities() decodes the escape
       * again, so the content ends up as the description with its entities
       * decoded.
       */
      sb = new StringBuilder(LEFT_ANGLE_BRACKET_PATTERN.matcher(description)
              .replaceAll("&lt;"));
    }
    content = translateEntities(sb.toString());
  }

  /**
   * Returns the description exactly as it was passed to the constructor.
   * 
   * @return the original text, or null if it was null or empty
   */
  public String getOrig()
  {
    return orig;
  }

  /**
   * Reports whether the description was treated as HTML.
   * 
   * @return true if the description contained an {@code <html>} tag
   */
  public boolean isHtmlContent()
  {
    return htmlContent;
  }

  /**
   * Returns the text produced by parsing the description.
   * 
   * @return the parsed text, or null if the description was null or empty
   */
  public String getContent()
  {
    return content;
  }

  /**
   * Returns the hyperlinks found in the description, each encoded as
   * "label|url". This is the internal list, not a copy.
   * 
   * @return the links in document order; empty if none were found
   */
  public List<String> getLinks()
  {
    return links;
  }

  /**
   * Returns the parsed content if the description was HTML, otherwise the
   * description as originally supplied.
   * 
   * @return parsed content or original text; null if the description was null
   *         or empty
   */
  public String getNonHtmlContent()
  {
    return isHtmlContent() ? content : orig;
  }

  /**
   * Decodes the character entities {@code &lt;}, {@code &gt;} and
   * {@code &amp;}.
   * 
   * @param s
   *          text that may contain entities
   * @return the text with those entities replaced by the characters they
   *         stand for
   */
  private static String translateEntities(String s)
  {
    /*
     * &amp; is decoded last, so that an escaped entity such as "&amp;lt;" is
     * decoded once (to "&lt;") and not twice (to "<").
     */
    return s.replace("&lt;", "<").replace("&gt;", ">").replace("&amp;",
            "&");
  }
}