File SecondaryStructureDistanceModel.java

Branches:

Statements:

102

Methods:

Classes:

LOC:

395

NCLOC:

246

Total complexity:

Complexity density:

0.44

Statements/Method:

8.5

Methods/Class:

Average method complexity:

3.75

Classes

Class	Line #	Total Statements	Complexity	TOTAL Coverage	Actions
SecondaryStructureDistanceModel	47	102	45	89.2% (0.8924051)

Class SecondaryStructureDistanceModel

Class SecondaryStructureDistanceModel	Line # 47	Total Statements 102	Complexity 45	TOTAL Coverage 89.2% (0.8924051)
Method	Line #	Statements	Complexity	Coverage
SecondaryStructureDistanceModel()	60	0	1	-
getInstance(AlignmentViewPanel) : ScoreModelI	65	8	3	62.5% (0.625)
configureFromAlignmentView(AlignmentViewPanel) : boolean	85	2	1	100% (1.0)
expandSeqData(SequenceI[],AlignmentView,SimilarityParamsI,List<String>,ArrayList<AlignmentAnnotation>,HashMap<Integer, String>) : SequenceI[]	94	32	8	88.6% (0.8863636)
findDistances(AlignmentView,SimilarityParamsI) : MatrixI	192	48	24	93.6% (0.9358974)
findSeqsWithoutGapAtColumn(SeqCigar[],int) : Set<SeqCigar>	341	6	2	100% (1.0)
getName() : String	359	1	1	100% (1.0)
getDescription() : String	365	1	1	0% (0.0)
isDNA() : boolean	371	1	1	100% (1.0)
isProtein() : boolean	377	1	1	100% (1.0)
isSecondaryStructure() : boolean	383	1	1	100% (1.0)
toString() : String	389	1	1	0% (0.0)

Contributing tests

This file is covered by 10 tests.

Contributing tests

Test contribution	Test	Result
0.8164557	jalview.project.Jalview2xmlTests.testSaveAndLoadAnnotationBasedTree	PASS
0.60126585	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withSSUndefinedInEitherOneSeq	PASS
0.60126585	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withGap	PASS
0.60126585	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withSSUndefinedInBothSeqs	PASS
0.5886076	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances	PASS
0.5886076	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances	PASS
0.5886076	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances	PASS
0.5886076	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances	PASS
0.050632913	jalview.gui.CalculationChooserTest.testGetApplicableScoreModels	PASS
0.012658228	jalview.analysis.scoremodels.ScoreModelsTest.testConstructor	PASS

Source view

/*
 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
 * Copyright (C) $$Year-Rel$$ The Jalview Authors
 *
 * This file is part of Jalview.
 *
 * Jalview is free software: you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation, either version 3
 * of the License, or (at your option) any later version.
 *
 * Jalview is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty
 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
 * PURPOSE. See the GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
 * The Jalview Authors are detailed in the 'AUTHORS' file.
 */

package jalview.analysis.scoremodels;

import jalview.analysis.AlignmentAnnotationUtils;

import jalview.analysis.AlignmentUtils;

import jalview.api.AlignmentViewPanel;

import jalview.api.FeatureRenderer;

import jalview.api.analysis.ScoreModelI;

import jalview.api.analysis.SimilarityParamsI;

import jalview.datamodel.AlignmentAnnotation;

import jalview.datamodel.AlignmentView;

import jalview.datamodel.SeqCigar;

import jalview.datamodel.SequenceI;

import jalview.math.Matrix;

import jalview.math.MatrixI;

import jalview.util.Constants;

import java.util.ArrayList;

import java.util.HashMap;

import java.util.HashSet;

import java.util.List;

import java.util.Map;

import java.util.Set;

/**
 * This class contains methods to calculate distance scores between the
 * secondary structure annotations of sequences.
 */

public class SecondaryStructureDistanceModel extends DistanceScoreModel

{

// Display name of this score model; returned by getName()
private static final String NAME = "Secondary Structure Similarity";

// Substitution matrix for secondary structure symbols; assigned in
// findDistances() from ScoreModels.getInstance().getSecondaryStructureMatrix()
private ScoreMatrix ssRateMatrix;

// Returned by getDescription(). NOTE(review): never assigned in the visible
// source, so it appears to stay null - confirm
private String description;

// Feature renderer cloned from the view in configureFromAlignmentView();
// expandSeqData() uses it to reach the viewport's alignment annotations
FeatureRenderer fr;

/**

* Constructor

104

public SecondaryStructureDistanceModel()

{

}

@Override

public ScoreModelI getInstance(AlignmentViewPanel view)

{

SecondaryStructureDistanceModel instance;

try

{

instance = this.getClass().getDeclaredConstructor().newInstance();

instance.configureFromAlignmentView(view);

return instance;

} catch (InstantiationException | IllegalAccessException e)

{

jalview.bin.Console.errPrintln("Error in " + getClass().getName()

+ ".getInstance(): " + e.getMessage());

return null;

} catch (ReflectiveOperationException roe)

{

return null;

}

/**
 * Binds this model to a view by storing a feature renderer cloned from it.
 *
 * @param view
 *          the alignment view panel that supplies the cloned renderer
 * @return always true
 */
boolean configureFromAlignmentView(AlignmentViewPanel view)
{
  this.fr = view.cloneFeatureRenderer();
  return true;
}

// Secondary structure annotation per expanded sequence entry, rebuilt by
// expandSeqData(); an entry is null where no annotation was found.
// findDistances() reads it by sequence index.
ArrayList<AlignmentAnnotation> ssForSeqs = null;

@Override

public SequenceI[] expandSeqData(SequenceI[] sequences,

AlignmentView seqData, SimilarityParamsI scoreParams,

List<String> labels, ArrayList<AlignmentAnnotation> ssAnnotationForSeqs,

HashMap<Integer, String> annotationDetails)

{

100

ssForSeqs = new ArrayList<AlignmentAnnotation>();

101

List<SequenceI> newSequences = new ArrayList<SequenceI>();

102

List<SeqCigar> newCigs = new ArrayList<SeqCigar>();

103

int sq = 0;

104

105

AlignmentAnnotation[] alignAnnotList = fr.getViewport().getAlignment()

106

.getAlignmentAnnotation();

107

108

String ssSource = scoreParams.getSecondaryStructureSource();

109

if (ssSource == null || ssSource == "")

110

{

111

ssSource = Constants.SS_ALL_PROVIDERS;

}

* Add secondary structure annotations that are added to the annotation track

116

* to the map

117

118

Map<SequenceI, ArrayList<AlignmentAnnotation>> ssAlignmentAnnotationForSequences = AlignmentUtils

119

.getSequenceAssociatedAlignmentAnnotations(alignAnnotList,

120

ssSource);

121

122

for (SeqCigar scig : seqData.getSequences())

123

{

124

// get the next sequence that should be bound to this scig: may be null

125

SequenceI alSeq = sequences[sq++];

126

List<AlignmentAnnotation> ssec = ssAlignmentAnnotationForSequences

127

.get(scig.getRefSeq());

if (ssec == null)

{

// not defined

newSequences.add(alSeq);

132

if (alSeq != null)

133

{

134

//labels.add("No Secondary Structure");

135

labels.add(Constants.STRUCTURE_PROVIDERS.get("None"));

136

}

137

SeqCigar newSeqCigar = scig; // new SeqCigar(scig);

138

newCigs.add(newSeqCigar);

ssForSeqs.add(null);

}

else

{

for (int i = 0; i < ssec.size(); i++)

{

if (alSeq != null)

{

// Add annotationDetails if the annotation has

148

// ANNOTATION_DETAILS property value (additional metadata)

149

150

if (ssec.get(i).hasAnnotationDetailsProperty())

151

{

152

// using key = labels.size() gives the position of the node

153

annotationDetails.put(labels.size(), ssec.get(i).getAnnotationDetailsProperty());

154

}

155

156

String provider = AlignmentAnnotationUtils

157

.extractSSSourceFromAnnotationDescription(ssec.get(i));

158

labels.add(provider);

159

}

160

newSequences.add(alSeq);

161

SeqCigar newSeqCigar = scig; // new SeqCigar(scig);

162

newCigs.add(newSeqCigar);

163

ssForSeqs.add(ssec.get(i));

}

}

}

ssAnnotationForSeqs.addAll(ssForSeqs);

168

seqData.setSequences(newCigs.toArray(new SeqCigar[0]));

169

return newSequences.toArray(new SequenceI[0]);

}

/**

* Calculates distance score [i][j] between each pair of protein sequences

175

* based on their secondary structure annotations (H, E, C). The final score

176

* is normalised by the number of alignment columns processed, providing an

177

* average similarity score.

178

* <p>

179

* The parameters argument can include settings for handling gap-residue

180

* aligned positions and may determine if the score calculation is based on

181

* the longer or shorter sequence in each pair. This can be important for

182

* handling partial alignments or sequences of significantly different

* lengths.

* @param seqData

* The aligned sequence data including secondary structure

187

* annotations.

188

* @param params

189

* Additional parameters for customising the scoring process, such as

190

* gap handling and sequence length consideration.

191

192

@Override

193

public MatrixI findDistances(AlignmentView seqData,

194

SimilarityParamsI params)

195

{

196

if (ssForSeqs == null

197

|| ssForSeqs.size() != seqData.getSequences().length)

198

{

199

// expandSeqData needs to be called to initialise the hash

200

SequenceI[] sequences = new SequenceI[seqData.getSequences().length];

201

// we throw away the new labels in this case..

202

expandSeqData(sequences, seqData, params, new ArrayList<String>(),

203

new ArrayList<AlignmentAnnotation>(), new HashMap<Integer, String>());

204

}

205

SeqCigar[] seqs = seqData.getSequences();

206

int noseqs = seqs.length; // no of sequences

207

int cpwidth = 0;

208

double[][] similarities = new double[noseqs][noseqs]; // matrix to store

209

// similarity score

210

// secondary structure source parameter selected by the user from the drop

211

// down.

212

String ssSource = params.getSecondaryStructureSource();

213

if (ssSource == null || ssSource == "")

214

{

215

ssSource = Constants.SS_ALL_PROVIDERS;

216

}

217

ssRateMatrix = ScoreModels.getInstance().getSecondaryStructureMatrix();

218

219

// need to get real position for view position

220

int[] viscont = seqData.getVisibleContigs();

221

222

223

* scan each column, compute and add to each similarity[i, j]

224

* the number of secondary structure annotation that seqi

225

* and seqj do not share

226

227

for (int vc = 0; vc < viscont.length; vc += 2)

228

{

229

// Iterates for each column position

230

152

for (int cpos = viscont[vc]; cpos <= viscont[vc + 1]; cpos++)

231

{

232

141

cpwidth++; // used to normalise the similarity score

233

234

235

* get set of sequences without gap in the current column

236

237

141

Set<SeqCigar> seqsWithoutGapAtCol = findSeqsWithoutGapAtColumn(seqs,

cpos);

* calculate similarity score for each secondary structure annotation on i'th and j'th

242

* sequence and add this measure to the similarities matrix

243

* for [i, j] for j > i

244

245

1898

for (int i = 0; i < (noseqs - 1); i++)

246

{

247

1757

AlignmentAnnotation aa_i = ssForSeqs.get(i);

248

1757

boolean undefinedSS1 = aa_i == null;

249

// check if the sequence contains gap in the current column

250

1757

boolean gap1 = !seqsWithoutGapAtCol.contains(seqs[i]);

251

// secondary structure is fetched only if the current column is not

252

// gap for the sequence

253

1757

char ss1 = '*';

254

1757

if (!gap1 && !undefinedSS1)

255

{

256

// fetch the position in sequence for the column and finds the

257

// corresponding secondary structure annotation

258

// TO DO - consider based on priority and displayed

259

376

int seqPosition_i = seqs[i].findPosition(cpos);

260

376

if (aa_i != null)

261

376

ss1 = AlignmentUtils.findSSAnnotationForGivenSeqposition(aa_i,

262

seqPosition_i);

263

}

264

// Iterates for each sequences

265

17250

for (int j = i + 1; j < noseqs; j++)

266

{

267

268

// check if ss is defined

269

15493

AlignmentAnnotation aa_j = ssForSeqs.get(j);

270

15493

boolean undefinedSS2 = aa_j == null;

271

272

// Set similarity to max score if both SS are not defined

273

15493

if (undefinedSS1 && undefinedSS2)

274

{

275

9231

similarities[i][j] += ssRateMatrix.getMaximumScore();

276

9231

continue;

277

}

278

279

// Set similarity to minimum score if either one SS is not defined

280

6262

else if (undefinedSS1 || undefinedSS2)

281

{

282

5656

similarities[i][j] += ssRateMatrix.getMinimumScore();

283

5656

continue;

284

}

285

286

606

boolean gap2 = !seqsWithoutGapAtCol.contains(seqs[j]);

287

288

// Variable to store secondary structure at the current column

289

606

char ss2 = '*';

290

291

606

if (!gap2 && !undefinedSS2)

292

{

293

564

int seqPosition = seqs[j].findPosition(cpos);

294

295

564

if (aa_j != null)

296

564

ss2 = AlignmentUtils.findSSAnnotationForGivenSeqposition(

aa_j, seqPosition);

}

606

if ((!gap1 && !gap2) || params.includeGaps())

301

{

302

// Calculate similarity score based on the substitution matrix

303

606

double similarityScore = ssRateMatrix.getPairwiseScore(ss1,

304

ss2);

305

606

similarities[i][j] += similarityScore;

}

}

}

}

}

* normalise the similarity scores (summed over columns) by the

314

* number of visible columns used in the calculation

315

* and fill in the bottom half of the matrix

316

317

// TODO JAL-2424 cpwidth may be out by 1 - affects scores but not tree shape

318

319

for (int i = 0; i < noseqs; i++)

320

{

321

201

for (int j = i + 1; j < noseqs; j++)

322

{

323

163

similarities[i][j] /= cpwidth;

324

163

similarities[j][i] = similarities[i][j];

325

}

326

}

327

return SimilarityScoreModel

328

.similarityToDistance(new Matrix(similarities));

}

/**

* Builds and returns a set containing sequences (SeqCigar) which do not have

334

* a gap at the given column position.

335

336

* @param seqs

337

* @param columnPosition

* (0..)

* @return

141

private Set<SeqCigar> findSeqsWithoutGapAtColumn(SeqCigar[] seqs,

342

int columnPosition)

343

{

344

141

Set<SeqCigar> seqsWithoutGapAtCol = new HashSet<>();

345

141

for (SeqCigar seq : seqs)

346

{

347

1898

int spos = seq.findPosition(columnPosition);

348

1898

if (spos != -1)

349

{

350

351

* position is not a gap

352

353

1587

seqsWithoutGapAtCol.add(seq);

354

}

355

}

356

141

return seqsWithoutGapAtCol;

357

}

358

359

189

@Override

360

public String getName()

361

{

362

189

return NAME;

}

/**
 * Returns the value of the description field. NOTE(review): nothing in the
 * visible source assigns that field, so this may return null - confirm.
 */
@Override
public String getDescription()
{
  return this.description;
}

/**
 * Always returns false.
 */
@Override
public boolean isDNA()
{
  return false;
}

/**
 * Always returns false.
 */
@Override
public boolean isProtein()
{
  return false;
}

/**
 * Always returns true.
 */
@Override
public boolean isSecondaryStructure()
{
  return true;
}

@Override

public String toString()

391

{

392

return "Score between sequences based on similarity between binary "

393

+ "vectors marking secondary structure displayed at each column";

394

}

395

}

Coverage Report

File SecondaryStructureDistanceModel.java

Coverage histogram

Code metrics

Classes

Class SecondaryStructureDistanceModel

Contributing tests

Contributing tests

Source view