File SecondaryStructureDistanceModel.java

Branches:

Statements:

104

Methods:

Classes:

LOC:

400

NCLOC:

250

Total complexity:

Complexity density:

0.45

Statements/Method:

8.67

Methods/Class:

Average method complexity:

3.92

Classes

Class	Line #	Total Statements	Complexity	TOTAL Coverage	Actions
SecondaryStructureDistanceModel	47	104	47	0.88271606 (88.3%)

Class SecondaryStructureDistanceModel

Class SecondaryStructureDistanceModel	Line # 47	Total Statements 104	Complexity 47	TOTAL Coverage 0.88271606 (88.3%)
SecondaryStructureDistanceModel()	60	0	1	-
getInstance(AlignmentViewPanel) : ScoreModelI	65	8	3	0.625 (62.5%)
configureFromAlignmentView(AlignmentViewPanel) : boolean	85	2	1	1.0 (100%)
expandSeqData(SequenceI[],AlignmentView,SimilarityParamsI,List<String>,ArrayList<AlignmentAnnotation>,HashMap<Integer, String>) : SequenceI[]	94	34	10	0.8541667 (85.4%)
findDistances(AlignmentView,SimilarityParamsI) : MatrixI	197	48	24	0.9358974 (93.6%)
findSeqsWithoutGapAtColumn(SeqCigar[],int) : Set<SeqCigar>	346	6	2	1.0 (100%)
getName() : String	364	1	1	1.0 (100%)
getDescription() : String	370	1	1	0.0 (0%)
isDNA() : boolean	376	1	1	1.0 (100%)
isProtein() : boolean	382	1	1	1.0 (100%)
isSecondaryStructure() : boolean	388	1	1	1.0 (100%)
toString() : String	394	1	1	0.0 (0%)

Contributing tests

This file is covered by 12 tests.

Contributing tests

Test contribution	Test	Result
0.80864197	jalview.project.Jalview2xmlTests.testSaveAndLoadAnnotationBasedTree	1	PASS
0.59876543	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withSSUndefinedInEitherOneSeq	1	PASS
0.59876543	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withSSUndefinedInBothSeqs	1	PASS
0.59876543	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withGap	1	PASS
0.58641976	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances	1	PASS
0.58641976	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances	1	PASS
0.58641976	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances	1	PASS
0.58641976	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances	1	PASS
0.049382716	jalview.gui.CalculationChooserTest.testGetApplicableScoreModels	1	PASS
0.018518519	jalview.io.cache.JvCacheableInputBoxTest.updateCacheTest	1	PASS
0.018518519	jalview.io.ScoreMatrixFileTest.testParse_ncbiFormat	1	PASS
0.012345679	jalview.analysis.scoremodels.ScoreModelsTest.testConstructor	1	PASS

Source view

* Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)

* Copyright (C) $$Year-Rel$$ The Jalview Authors

* This file is part of Jalview.

* Jalview is free software: you can redistribute it and/or

* modify it under the terms of the GNU General Public License

* as published by the Free Software Foundation, either version 3

* of the License, or (at your option) any later version.

* Jalview is distributed in the hope that it will be useful, but

* WITHOUT ANY WARRANTY; without even the implied warranty

* of MERCHANTABILITY or FITNESS FOR A PARTICULAR

* PURPOSE. See the GNU General Public License for more details.

* You should have received a copy of the GNU General Public License

* along with Jalview. If not, see <http://www.gnu.org/licenses/>.

* The Jalview Authors are detailed in the 'AUTHORS' file.

package jalview.analysis.scoremodels;

import jalview.analysis.AlignmentAnnotationUtils;

import jalview.analysis.AlignmentUtils;

import jalview.api.AlignmentViewPanel;

import jalview.api.FeatureRenderer;

import jalview.api.analysis.ScoreModelI;

import jalview.api.analysis.SimilarityParamsI;

import jalview.datamodel.AlignmentAnnotation;

import jalview.datamodel.AlignmentView;

import jalview.datamodel.SeqCigar;

import jalview.datamodel.SequenceI;

import jalview.math.Matrix;

import jalview.math.MatrixI;

import jalview.util.Constants;

import java.util.ArrayList;

import java.util.HashMap;

import java.util.HashSet;

import java.util.List;

import java.util.Map;

import java.util.Set;

/*
 * This class contains methods to calculate the distance score between
 * the secondary structure annotations of the sequences.
 */

public class SecondaryStructureDistanceModel extends DistanceScoreModel

{

private static final String NAME = "Secondary Structure Similarity";

private ScoreMatrix ssRateMatrix;

private String description;

FeatureRenderer fr;

/**

* Constructor

public SecondaryStructureDistanceModel()

{

}

@Override

public ScoreModelI getInstance(AlignmentViewPanel view)

{

SecondaryStructureDistanceModel instance;

try

{

instance = this.getClass().getDeclaredConstructor().newInstance();

instance.configureFromAlignmentView(view);

return instance;

} catch (InstantiationException | IllegalAccessException e)

{

jalview.bin.Console.errPrintln("Error in " + getClass().getName()

+ ".getInstance(): " + e.getMessage());

return null;

} catch (ReflectiveOperationException roe)

{

return null;

}

/**
 * Stores a clone of the view panel's feature renderer in this model.
 *
 * @param view
 *          the alignment view panel to take the feature renderer from
 * @return always true
 */
boolean configureFromAlignmentView(AlignmentViewPanel view)
{
  this.fr = view.cloneFeatureRenderer();
  return true;
}

ArrayList<AlignmentAnnotation> ssForSeqs = null;

@Override

public SequenceI[] expandSeqData(SequenceI[] sequences,

AlignmentView seqData, SimilarityParamsI scoreParams,

List<String> labels, ArrayList<AlignmentAnnotation> ssAnnotationForSeqs,

HashMap<Integer, String> annotationDetails)

{

100

ssForSeqs = new ArrayList<AlignmentAnnotation>();

101

List<SequenceI> newSequences = new ArrayList<SequenceI>();

102

List<SeqCigar> newCigs = new ArrayList<SeqCigar>();

103

int sq = 0;

104

105

AlignmentAnnotation[] alignAnnotList = fr.getViewport().getAlignment()

106

.getAlignmentAnnotation();

107

108

String ssSource = scoreParams.getSecondaryStructureSource();

109

if (ssSource == null || ssSource == "")

110

{

111

ssSource = Constants.SS_ALL_PROVIDERS;

}

* Add secondary structure annotations that are added to the annotation track

116

* to the map

117

118

Map<SequenceI, ArrayList<AlignmentAnnotation>> ssAlignmentAnnotationForSequences = AlignmentUtils

119

.getSequenceAssociatedAlignmentAnnotations(alignAnnotList,

120

ssSource);

121

122

for (SeqCigar scig : seqData.getSequences())

123

{

124

// get the next sequence that should be bound to this scig: may be null

125

SequenceI alSeq = sequences[sq++];

126

List<AlignmentAnnotation> ssec = ssAlignmentAnnotationForSequences

127

.get(scig.getRefSeq());

128

129

if (ssec == null && scoreParams.getExcludeSeqWithoutAnnot())

{

continue;

}

else if (ssec == null)

134

{

135

// not defined

136

newSequences.add(alSeq);

137

if (alSeq != null)

138

{

139

//labels.add("No Secondary Structure");

140

labels.add(Constants.STRUCTURE_PROVIDERS.get("None"));

141

}

142

SeqCigar newSeqCigar = scig; // new SeqCigar(scig);

143

newCigs.add(newSeqCigar);

ssForSeqs.add(null);

}

else

{

for (int i = 0; i < ssec.size(); i++)

{

if (alSeq != null)

{

// Add annotationDetails if the annotation has

153

// ANNOTATION_DETAILS property value (additional metadata)

154

155

if (ssec.get(i).hasAnnotationDetailsProperty())

156

{

157

// using key = labels.size() gives the position of the node

158

annotationDetails.put(labels.size(), ssec.get(i).getAnnotationDetailsProperty());

159

}

160

161

String provider = AlignmentAnnotationUtils

162

.extractSSSourceFromAnnotationDescription(ssec.get(i));

163

labels.add(provider);

164

}

165

newSequences.add(alSeq);

166

SeqCigar newSeqCigar = scig; // new SeqCigar(scig);

167

newCigs.add(newSeqCigar);

168

ssForSeqs.add(ssec.get(i));

}

}

}

ssAnnotationForSeqs.addAll(ssForSeqs);

173

seqData.setSequences(newCigs.toArray(new SeqCigar[0]));

174

return newSequences.toArray(new SequenceI[0]);

}

/**

* Calculates distance score [i][j] between each pair of protein sequences

180

* based on their secondary structure annotations (H, E, C). The final score

181

* is normalised by the number of alignment columns processed, providing an

182

* average similarity score.

183

* <p>

184

* The parameters argument can include settings for handling gap-residue

185

* aligned positions and may determine if the score calculation is based on

186

* the longer or shorter sequence in each pair. This can be important for

187

* handling partial alignments or sequences of significantly different

* lengths.

* @param seqData

* The aligned sequence data including secondary structure

192

* annotations.

193

* @param params

194

* Additional parameters for customising the scoring process, such as

195

* gap handling and sequence length consideration.

196

197

@Override

198

public MatrixI findDistances(AlignmentView seqData,

199

SimilarityParamsI params)

200

{

201

if (ssForSeqs == null

202

|| ssForSeqs.size() != seqData.getSequences().length)

203

{

204

// expandSeqData needs to be called to initialise the hash

205

SequenceI[] sequences = new SequenceI[seqData.getSequences().length];

206

// we throw away the new labels in this case..

207

expandSeqData(sequences, seqData, params, new ArrayList<String>(),

208

new ArrayList<AlignmentAnnotation>(), new HashMap<Integer, String>());

209

}

210

SeqCigar[] seqs = seqData.getSequences();

211

int noseqs = seqs.length; // no of sequences

212

int cpwidth = 0;

213

double[][] similarities = new double[noseqs][noseqs]; // matrix to store

214

// similarity score

215

// secondary structure source parameter selected by the user from the drop

216

// down.

217

String ssSource = params.getSecondaryStructureSource();

218

if (ssSource == null || ssSource == "")

219

{

220

ssSource = Constants.SS_ALL_PROVIDERS;

221

}

222

ssRateMatrix = ScoreModels.getInstance().getSecondaryStructureMatrix();

223

224

// need to get real position for view position

225

int[] viscont = seqData.getVisibleContigs();

226

227

228

* scan each column, compute and add to each similarity[i, j]

229

* the number of secondary structure annotation that seqi

230

* and seqj do not share

231

232

for (int vc = 0; vc < viscont.length; vc += 2)

233

{

234

// Iterates for each column position

235

152

for (int cpos = viscont[vc]; cpos <= viscont[vc + 1]; cpos++)

236

{

237

141

cpwidth++; // used to normalise the similarity score

238

239

240

* get set of sequences without gap in the current column

241

242

141

Set<SeqCigar> seqsWithoutGapAtCol = findSeqsWithoutGapAtColumn(seqs,

cpos);

* calculate similarity score for each secondary structure annotation on i'th and j'th

247

* sequence and add this measure to the similarities matrix

248

* for [i, j] for j > i

249

250

1898

for (int i = 0; i < (noseqs - 1); i++)

251

{

252

1757

AlignmentAnnotation aa_i = ssForSeqs.get(i);

253

1757

boolean undefinedSS1 = aa_i == null;

254

// check if the sequence contains gap in the current column

255

1757

boolean gap1 = !seqsWithoutGapAtCol.contains(seqs[i]);

256

// secondary structure is fetched only if the current column is not

257

// gap for the sequence

258

1757

char ss1 = '*';

259

1757

if (!gap1 && !undefinedSS1)

260

{

261

// fetch the position in sequence for the column and finds the

262

// corresponding secondary structure annotation

263

// TO DO - consider based on priority and displayed

264

376

int seqPosition_i = seqs[i].findPosition(cpos);

265

376

if (aa_i != null)

266

376

ss1 = AlignmentUtils.findSSAnnotationForGivenSeqposition(aa_i,

267

seqPosition_i);

268

}

269

// Iterates for each sequences

270

17250

for (int j = i + 1; j < noseqs; j++)

271

{

272

273

// check if ss is defined

274

15493

AlignmentAnnotation aa_j = ssForSeqs.get(j);

275

15493

boolean undefinedSS2 = aa_j == null;

276

277

// Set similarity to max score if both SS are not defined

278

15493

if (undefinedSS1 && undefinedSS2)

279

{

280

9231

similarities[i][j] += ssRateMatrix.getMaximumScore();

281

9231

continue;

282

}

283

284

// Set similarity to minimum score if either one SS is not defined

285

6262

else if (undefinedSS1 || undefinedSS2)

286

{

287

5656

similarities[i][j] += ssRateMatrix.getMinimumScore();

288

5656

continue;

289

}

290

291

606

boolean gap2 = !seqsWithoutGapAtCol.contains(seqs[j]);

292

293

// Variable to store secondary structure at the current column

294

606

char ss2 = '*';

295

296

606

if (!gap2 && !undefinedSS2)

297

{

298

564

int seqPosition = seqs[j].findPosition(cpos);

299

300

564

if (aa_j != null)

301

564

ss2 = AlignmentUtils.findSSAnnotationForGivenSeqposition(

aa_j, seqPosition);

}

606

if ((!gap1 && !gap2) || params.includeGaps())

306

{

307

// Calculate similarity score based on the substitution matrix

308

606

double similarityScore = ssRateMatrix.getPairwiseScore(ss1,

309

ss2);

310

606

similarities[i][j] += similarityScore;

}

}

}

}

}

* normalise the similarity scores (summed over columns) by the

319

* number of visible columns used in the calculation

320

* and fill in the bottom half of the matrix

321

322

// TODO JAL-2424 cpwidth may be out by 1 - affects scores but not tree shape

323

324

for (int i = 0; i < noseqs; i++)

325

{

326

201

for (int j = i + 1; j < noseqs; j++)

327

{

328

163

similarities[i][j] /= cpwidth;

329

163

similarities[j][i] = similarities[i][j];

330

}

331

}

332

return SimilarityScoreModel

333

.similarityToDistance(new Matrix(similarities));

}

/**

* Builds and returns a set containing sequences (SeqCigar) which do not have

339

* a gap at the given column position.

340

341

* @param seqs

342

* @param columnPosition

* (0..)

* @return

141

private Set<SeqCigar> findSeqsWithoutGapAtColumn(SeqCigar[] seqs,

347

int columnPosition)

348

{

349

141

Set<SeqCigar> seqsWithoutGapAtCol = new HashSet<>();

350

141

for (SeqCigar seq : seqs)

351

{

352

1898

int spos = seq.findPosition(columnPosition);

353

1898

if (spos != -1)

354

{

355

356

* position is not a gap

357

358

1587

seqsWithoutGapAtCol.add(seq);

359

}

360

}

361

141

return seqsWithoutGapAtCol;

362

}

363

364

157

@Override

365

public String getName()

366

{

367

157

return NAME;

}

/**
 * Returns the description field of this score model. The field is not
 * assigned anywhere in this class as shown, so the result is currently
 * null.
 *
 * @return the description field
 */
@Override
public String getDescription()
{
  return this.description;
}

/**
 * This model is not flagged as a DNA score model.
 *
 * @return always false
 */
@Override
public boolean isDNA()
{
  final boolean dna = false;
  return dna;
}

/**
 * This model is not flagged as a protein score model.
 *
 * @return always false
 */
@Override
public boolean isProtein()
{
  final boolean protein = false;
  return protein;
}

/**
 * This model is flagged as a secondary structure score model.
 *
 * @return always true
 */
@Override
public boolean isSecondaryStructure()
{
  final boolean secondaryStructure = true;
  return secondaryStructure;
}

@Override

public String toString()

396

{

397

return "Score between sequences based on similarity between binary "

398

+ "vectors marking secondary structure displayed at each column";

399

}

400

}

Coverage Report

File SecondaryStructureDistanceModel.java

Coverage histogram

Code metrics

Classes

Class SecondaryStructureDistanceModel

Contributing tests

Contributing tests

Source view