File ParseHtmlBodyAndLinks.java

Branches:

Statements:

Methods:

Classes:

LOC:

183

NCLOC:

101

Total complexity:

Complexity density:

0.52

Statements/Method:

Methods/Class:

Average method complexity:

3.14

Classes

Class	Line #	Total Statements	Complexity	TOTAL Coverage	Actions
ParseHtmlBodyAndLinks	36	42	22	0.00%

Class ParseHtmlBodyAndLinks

Class ParseHtmlBodyAndLinks	Line # 36	Total Statements 42	Complexity 22	TOTAL Coverage 0.00%
getOrig() : String getOrig() : String	4343	1.01	1.01	0.0 0.00%
isHtmlContent() : boolean isHtmlContent() : boolean	5353	1.01	1.01	0.0 0.00%
getContent() : String getContent() : String	6767	1.01	1.01	0.0 0.00%
getLinks() : List<String> getLinks() : List<String>	7878	1.01	1.01	0.0 0.00%
ParseHtmlBodyAndLinks(String,boolean,String) ParseHtmlBodyAndLinks(String,boolean,String)	9999	33.033	15.015	0.0 0.00%
translateEntities(String) : String translateEntities(String) : String	164164	4.04	1.01	0.0 0.00%
getNonHtmlContent() : String getNonHtmlContent() : String	178178	1.01	2.02	0.0 0.00%

Contributing tests

No tests hitting this source file were found.

Source view

/*
 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
 * Copyright (C) $$Year-Rel$$ The Jalview Authors
 *
 * This file is part of Jalview.
 *
 * Jalview is free software: you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation, either version 3
 * of the License, or (at your option) any later version.
 *
 * Jalview is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty
 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
 * PURPOSE. See the GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
 * The Jalview Authors are detailed in the 'AUTHORS' file.
 */

package jalview.util;

import java.util.Locale;

import java.util.ArrayList;

import java.util.List;

import java.util.StringTokenizer;

import java.util.regex.Pattern;

/**
 * Utility class for dealing with HTML link extraction. Given a description
 * that may contain simple HTML markup, it collects {@code <a href="...">}
 * links and builds a text version of the description in which tags are
 * dropped, each link label is followed by a %LINK% placeholder, and
 * {@code <br>} tags are replaced by a caller-supplied newline string.
 * <p>
 * Parsing is done with a simple tokenizer, not a full HTML parser.
 * 
 * @author jprocter
 */
public class ParseHtmlBodyAndLinks
{
  /** Marker appended to the content after the label of each extracted link. */
  private static final String LINK_PLACEHOLDER = "%LINK%";

  /** The description as passed to the constructor; null if it was null/empty. */
  String orig = null;

  /** True if the description contained an {@code <html>} tag (any case). */
  boolean htmlContent = true;

  /** Extracted links, each encoded as "label|url". */
  List<String> links = new ArrayList<String>();

  /** Parsed content; stays null if the description was null or empty. */
  String content;

  /**
   * @return the original description, or null if it was null or empty
   */
  public String getOrig()
  {
    return orig;
  }

  /**
   * @return true if the content looked like HTML
   */
  public boolean isHtmlContent()
  {
    return htmlContent;
  }

  /**
   * result of parsing description - with or without HTML tags
   * 
   * @return the parsed content, or null if the description was null or empty
   */
  public String getContent()
  {
    return content;
  }

  /**
   * list of Label|Link encoded URL links extracted from HTML
   * 
   * @return the (possibly empty) list of links; this is the internal list, not
   *         a copy
   */
  public List<String> getLinks()
  {
    return links;
  }

  /**
   * Parses the given html and
   * <ul>
   * <li>extracts any 'href' links to a list of "displayName|url" strings,
   * retrievable by #getLinks</li>
   * <li>extracts the remaining text (with %LINK% placeholders replacing hrefs),
   * retrievable by #getContent</li>
   * </ul>
   * The entities &amp;lt;, &amp;gt; and &amp;amp; in the resulting content are
   * translated to their literal characters. A null or empty description
   * leaves the content and original null and the link list empty.
   * 
   * @param description
   *          - html or text content to be parsed
   * @param removeHTML
   *          when true and the description contains no {@code <html>} tag, the
   *          content is taken from the description as given (tags kept,
   *          entities translated) rather than from the tag-stripped text; it
   *          has no effect otherwise. NOTE(review): the flag name suggests
   *          the opposite - confirm against callers.
   * @param newline
   *          string substituted for each {@code <br>} tag
   */
  public ParseHtmlBodyAndLinks(String description, boolean removeHTML,
          String newline)
  {
    if (description == null || description.length() == 0)
    {
      htmlContent = false;
      return;
    }
    orig = description;
    htmlContent = description.toUpperCase(Locale.ROOT)
            .indexOf("<HTML>") != -1;

    // links are always extracted, even when the stripped text is not used
    String parsed = extractTextAndLinks(description, newline);
    if (removeHTML && !htmlContent)
    {
      // instead of parsing the html into plaintext, keep the description
      // as it was given
      parsed = description;
    }
    content = translateEntities(parsed);
  }

  /**
   * Walks the description tag by tag, adding any links found to
   * {@link #links} and returning the text with tags removed.
   * 
   * @param description
   *          non-empty text to scan
   * @param newline
   *          string substituted for each line break tag
   * @return the text content with %LINK% placeholders after link labels
   */
  private String extractTextAndLinks(String description, String newline)
  {
    StringBuilder text = new StringBuilder(description.length());
    StringTokenizer st = new StringTokenizer(description, "<");
    while (st.hasMoreElements())
    {
      // splitting on '>' yields chunks of the form "text<tag"
      String token = st.nextToken(">");
      if (token.equalsIgnoreCase("html") || token.startsWith("/"))
      {
        continue;
      }

      String tag = null;
      int startTag = token.indexOf('<');
      if (startTag > -1)
      {
        tag = token.substring(startTag + 1);
        token = token.substring(0, startTag);
      }

      if (tag == null)
      {
        text.append(token);
      }
      else if (tag.toUpperCase(Locale.ROOT).startsWith("A HREF="))
      {
        text.append(token);
        String link = extractHref(tag);
        // an anchor at the very end of the input has no label to read;
        // use an empty label instead of failing
        String label = st.hasMoreTokens() ? st.nextToken("<>") : "";
        links.add(label + "|" + link);
        text.append(label).append(LINK_PLACEHOLDER);
      }
      else if (isLineBreak(tag))
      {
        // keep the text that preceded the break, then start a new line
        text.append(token).append(newline);
      }
      else
      {
        text.append(token);
      }
    }
    return text.toString();
  }

  /**
   * Extracts the href value from the inside of an anchor tag such as
   * {@code a href="http://example.org" target="x"}.
   * 
   * @param tag
   *          tag text (without angle brackets) starting with "a href="
   * @return the text between the first pair of double quotes; if the closing
   *         quote is missing, everything after the opening quote; if there
   *         are no quotes, the text after '=' up to the first space
   */
  private static String extractHref(String tag)
  {
    int open = tag.indexOf('"');
    if (open == -1)
    {
      String value = tag.substring(tag.indexOf('=') + 1).trim();
      int space = value.indexOf(' ');
      return space == -1 ? value : value.substring(0, space);
    }
    int close = tag.indexOf('"', open + 1);
    return close == -1 ? tag.substring(open + 1)
            : tag.substring(open + 1, close);
  }

  /**
   * @param tag
   *          tag text without angle brackets
   * @return true for "br", "br/" or "br /" in any letter case
   */
  private static boolean isLineBreak(String tag)
  {
    String name = tag.trim();
    if (name.endsWith("/"))
    {
      name = name.substring(0, name.length() - 1).trim();
    }
    return name.equalsIgnoreCase("br");
  }

  /**
   * Replaces the entities &amp;lt;, &amp;gt; and &amp;amp; with the
   * characters they stand for. The ampersand entity is handled last so that
   * an escaped entity name (e.g. "&amp;amp;lt;") is decoded only one level.
   * 
   * @param s
   *          text to translate (not null)
   * @return the text with the three entities replaced
   */
  private static String translateEntities(String s)
  {
    s = s.replace("&lt;", "<");
    s = s.replace("&gt;", ">");
    s = s.replace("&amp;", "&");
    return s;
  }

  /**
   * get either the parsed content or the original, depending on whether the
   * original looked like html content or not.
   * 
   * @return the parsed content if the original contained an html tag,
   *         otherwise the original description
   */
  public String getNonHtmlContent()
  {
    return isHtmlContent() ? content : orig;
  }
}

Coverage Report

File ParseHtmlBodyAndLinks.java

Coverage histogram

Code metrics

Classes

Class ParseHtmlBodyAndLinks

Contributing tests

Source view