File ParseHtmlBodyAndLinks.java

Branches:

Statements:

Methods:

Classes:

LOC:

181

NCLOC:

100

Total complexity:

Complexity density:

0.52

Statements/Method:

Methods/Class:

Average method complexity:

3.14

Classes

Class	Line #	Total Statements	Complexity	Uncovered Elements	TOTAL Coverage	Actions
ParseHtmlBodyAndLinks	34	42	22	9	87%

Class ParseHtmlBodyAndLinks

Class ParseHtmlBodyAndLinks	Line # 34	Total Statements 42	Complexity 22	Uncovered Elements 9	TOTAL Coverage 87%
getOrig() : String	41	1	1	1	0%
isHtmlContent() : boolean	51	1	1	0	100%
getContent() : String	65	1	1	0	100%
getLinks() : List<String>	76	1	1	0	100%
ParseHtmlBodyAndLinks(String,boolean,String)	97	33	15	7	86.3%
translateEntities(String) : String	162	4	1	0	100%
getNonHtmlContent() : String	176	1	2	0	100%

Contributing tests

No tests hitting this source file were found.

Source view

/*
 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
 * Copyright (C) $$Year-Rel$$ The Jalview Authors
 *
 * This file is part of Jalview.
 *
 * Jalview is free software: you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation, either version 3
 * of the License, or (at your option) any later version.
 *
 * Jalview is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty
 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
 * PURPOSE. See the GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
 * The Jalview Authors are detailed in the 'AUTHORS' file.
 */

package jalview.util;

import java.util.ArrayList;

import java.util.List;

import java.util.StringTokenizer;

import java.util.regex.Pattern;

/**
 * Utility class for dealing with HTML link extraction.
 * <p>
 * A description is parsed once, in the constructor; the extracted links and
 * the remaining text are then available through the getters.
 *
 * @author jprocter
 */
public class ParseHtmlBodyAndLinks
{
  private static final Pattern LEFT_ANGLE_BRACKET_PATTERN = Pattern
          .compile("<");

  /** Prefix (matched ignoring case) of an anchor tag that carries an href. */
  private static final String HREF_PREFIX = "A HREF=";

  /** Placeholder written into the content after each extracted link label. */
  private static final String LINK_PLACEHOLDER = "%LINK%";

  String orig = null;

  /**
   * @return the description exactly as passed to the constructor, or null if
   *         it was null or empty
   */
  public String getOrig()
  {
    return orig;
  }

  boolean htmlContent = true;

  /**
   * @return true if the content looked like HTML
   */
  public boolean isHtmlContent()
  {
    return htmlContent;
  }

  List<String> links = new ArrayList<String>();

  String content;

  /**
   * result of parsing description - with or without HTML tags
   *
   * @return the parsed content, or null if the description was null or empty
   */
  public String getContent()
  {
    return content;
  }

  /**
   * list of Label|Link encoded URL links extracted from HTML
   *
   * @return the (possibly empty) list of "label|url" strings
   */
  public List<String> getLinks()
  {
    return links;
  }

  /**
   * Parses the given html and
   * <ul>
   * <li>extracts any 'href' links to a list of "displayName|url" strings,
   * retrievable by #getLinks</li>
   * <li>extracts the remaining text (with %LINK% placeholders replacing hrefs),
   * retrievable by #getContent</li>
   * </ul>
   * A description is treated as HTML only if it contains the literal tag
   * {@code <html>} (in any case). The entities {@code &lt;}, {@code &gt;} and
   * {@code &amp;} in the resulting content are translated to their characters.
   * <p>
   * Note: an anchor tag that is not followed by any label text causes
   * {@link StringTokenizer#nextToken(String)} to throw
   * {@code java.util.NoSuchElementException}.
   *
   * @param description
   *          - html or text content to be parsed
   * @param removeHTML
   *          flag to indicate if HTML tags should be removed if they are
   *          present.
   * @param newline
   *          text appended to the content in place of each {@code <br>} tag
   */
  public ParseHtmlBodyAndLinks(String description, boolean removeHTML,
          String newline)
  {
    if (description == null || description.length() == 0)
    {
      htmlContent = false;
      return;
    }
    StringBuilder sb = new StringBuilder(description.length());
    if (description.toUpperCase().indexOf("<HTML>") == -1)
    {
      htmlContent = false;
    }
    orig = description;

    /*
     * Each token read with the '>' delimiter has the form "text<tag": the
     * text preceding a tag followed by the tag's content without its closing
     * bracket.
     */
    StringTokenizer st = new StringTokenizer(description, "<");
    while (st.hasMoreElements())
    {
      String token = st.nextToken(">");
      // legacy guard retained unchanged from the original implementation
      if (token.equalsIgnoreCase("html") || token.startsWith("/"))
      {
        continue;
      }

      String tag = null;
      int startTag = token.indexOf('<');
      if (startTag > -1)
      {
        tag = token.substring(startTag + 1);
        token = token.substring(0, startTag);
      }

      // text in front of the tag is kept whatever kind of tag follows it
      sb.append(token);

      if (tag == null)
      {
        continue;
      }
      if (tag.regionMatches(true, 0, HREF_PREFIX, 0, HREF_PREFIX.length()))
      {
        String link = extractHref(tag);
        // the label is the text between the anchor's '>' and the next '<'
        String label = st.nextToken("<>");
        links.add(label + "|" + link);
        sb.append(label).append(LINK_PLACEHOLDER);
      }
      else if (tag.equalsIgnoreCase("br"))
      {
        sb.append(newline);
      }
    }
    if (removeHTML && !htmlContent)
    {
      // instead of parsing the html into plaintext
      // clean the description ready for embedding in html
      // NOTE(review): translateEntities below turns "&lt;" back into "<",
      // so the net content is the entity-decoded description - confirm intent
      sb = new StringBuilder(LEFT_ANGLE_BRACKET_PATTERN.matcher(description)
              .replaceAll("&lt;"));
    }
    content = translateEntities(sb.toString());
  }

  /**
   * Extracts the href value from an anchor tag's content (the text between
   * '<' and '>'), which must start with "a href=" in any case. The value may
   * be enclosed in double or single quotes, in which case it ends at the
   * matching quote (or at the end of the tag if the quote is never closed);
   * an unquoted value ends at the first whitespace character. Any attributes
   * following the href are ignored.
   *
   * @param tag
   *          anchor tag content, e.g. {@code a href="http://x.y"}
   * @return the href value, possibly empty
   */
  private static String extractHref(String tag)
  {
    String value = tag.substring(HREF_PREFIX.length()).trim();
    if (value.length() == 0)
    {
      return "";
    }
    char first = value.charAt(0);
    if (first == '"' || first == '\'')
    {
      int close = value.indexOf(first, 1);
      return close < 0 ? value.substring(1) : value.substring(1, close);
    }
    int end = 0;
    while (end < value.length()
            && !Character.isWhitespace(value.charAt(end)))
    {
      end++;
    }
    return value.substring(0, end);
  }

  /**
   * Replaces the entities {@code &lt;}, {@code &gt;} and {@code &amp;} with
   * the characters they stand for. {@code &amp;} is translated last so that
   * an escaped entity such as {@code &amp;lt;} becomes the text {@code &lt;}
   * rather than being decoded twice.
   *
   * @param s
   *          text possibly containing entities
   * @return the text with the three entities translated
   */
  private static String translateEntities(String s)
  {
    s = s.replace("&lt;", "<");
    s = s.replace("&gt;", ">");
    s = s.replace("&amp;", "&");
    return s;
  }

  /**
   * get either the parsed content or the original, depending on whether the
   * original looked like html content or not.
   *
   * @return the parsed content if the description looked like HTML, otherwise
   *         the original description
   */
  public String getNonHtmlContent()
  {
    return isHtmlContent() ? content : orig;
  }
}

jalviewX

File ParseHtmlBodyAndLinks.java

Coverage histogram

Code metrics

Classes

Class ParseHtmlBodyAndLinks

Contributing tests

Source view