File AAFrequency.java

Branches:

Statements:

218

Methods:

Classes:

LOC:

721

NCLOC:

424

Total complexity:

Complexity density:

0.34

Statements/Method:

16.77

Methods/Class:

Average method complexity:

5.69

Classes

Class	Line #	Total Statements	Complexity	Uncovered Elements	TOTAL Coverage	Actions
AAFrequency	54	218	74	74	0.77507677.5%

Class AAFrequency

Class AAFrequency	Line # 54	Total Statements 218	Complexity 74	Uncovered Elements 74	TOTAL Coverage 0.77507677.5%
<clinit>, line 63() <clinit>, line 63()	6363	2.02	2.02	0.00	1.0 1.0100%
calculate(List<SequenceI>,int,int) : ProfilesI calculate(List<SequenceI>,int,int) : ProfilesI	7171	1.01	1.01	0.00	1.0 1.0100%
calculate(List<SequenceI>,int,int,boolean) : ProfilesI calculate(List<SequenceI>,int,int,boolean) : ProfilesI	7777	12.012	4.04	0.00	1.0 1.0100%
calculate(SequenceI[],int,int,int,boolean) : ProfilesI calculate(SequenceI[],int,int,int,boolean) : ProfilesI	117117	29.029	10.010	3.03	0.93333334 0.9333333493.3%
estimateProfileSize(SparseIntArray) : int estimateProfileSize(SparseIntArray) : int	204204	3.03	2.02	5.05	0.0 0.00%
completeConsensus(AlignmentAnnotation,ProfilesI,int,int,boolean,boolean,long) : void completeConsensus(AlignmentAnnotation,ProfilesI,int,int,boolean,boolean,long) : void	240240	16.016	8.08	5.05	0.8076923 0.807692380.8%
completeGapAnnot(AlignmentAnnotation,ProfilesI,int,int,long) : void completeGapAnnot(AlignmentAnnotation,ProfilesI,int,int,long) : void	303303	13.013	6.06	5.05	0.7368421 0.736842173.7%
getTooltip(ProfileI,float,boolean,boolean,int) : String getTooltip(ProfileI,float,boolean,boolean,int) : String	361361	16.016	6.06	0.00	1.0 1.0100%
extractProfile(ProfileI,boolean) : int[] extractProfile(ProfileI,boolean) : int[]	412412	24.024	4.04	2.02	0.93333334 0.9333333493.3%
extractCdnaProfile(Hashtable,boolean) : int[] extractCdnaProfile(Hashtable,boolean) : int[]	464464	25.025	5.05	33.033	0.0 0.00%
calculateCdna(AlignmentI,Hashtable[]) : void calculateCdna(AlignmentI,Hashtable[]) : void	520520	22.022	6.06	3.03	0.9 0.990%
completeCdnaConsensus(AlignmentAnnotation,Hashtable[],boolean,int) : void completeCdnaConsensus(AlignmentAnnotation,Hashtable[],boolean,int) : void	577577	50.050	18.018	13.013	0.8243243 0.824324382.4%
getPercentageDp(long) : int getPercentageDp(long) : int	711711	5.05	2.02	3.03	0.5714286 0.571428657.1%

Contributing tests

This file is covered by 82 tests.

Contributing tests

Test contribution	Test	Result
0.5744681	jalview.io.FeaturesFileTest.simpleGff3FileLoaderjalview.io.FeaturesFileTest.simpleGff3FileLoader	1PASS
0.48024315	jalview.io.Jalview2xmlTests.testStoreAndRecoverExpandedviewsjalview.io.Jalview2xmlTests.testStoreAndRecoverExpandedviews	1PASS
0.48024315	jalview.io.Jalview2xmlTests.gatherViewsHerejalview.io.Jalview2xmlTests.gatherViewsHere	1PASS
0.48024315	jalview.io.Jalview2xmlTests.testStoreAndRecoverReferenceSeqSettingsjalview.io.Jalview2xmlTests.testStoreAndRecoverReferenceSeqSettings	1PASS
0.48024315	jalview.io.Jalview2xmlTests.testCopyViewSettingsjalview.io.Jalview2xmlTests.testCopyViewSettings	1PASS
0.48024315	jalview.io.Jalview2xmlTests.viewRefPdbAnnotationjalview.io.Jalview2xmlTests.viewRefPdbAnnotation	1PASS
0.48024315	jalview.io.Jalview2xmlTests.noDuplicatePdbMappingsMadejalview.io.Jalview2xmlTests.noDuplicatePdbMappingsMade	1PASS
0.443769	jalview.io.Jalview2xmlTests.testStoreAndRecoverColourThresholdsjalview.io.Jalview2xmlTests.testStoreAndRecoverColourThresholds	1PASS
0.44072947	jalview.io.Jalview2xmlTests.testColourByAnnotScoresjalview.io.Jalview2xmlTests.testColourByAnnotScores	1PASS
0.38905776	jalview.io.Jalview2xmlTests.testStoreAndRecoverGroupRepSeqsjalview.io.Jalview2xmlTests.testStoreAndRecoverGroupRepSeqs	1PASS
0.38601825	jalview.io.Jalview2xmlTests.testTCoffeeScoresjalview.io.Jalview2xmlTests.testTCoffeeScores	1PASS
0.3799392	jalview.io.Jalview2xmlTests.testRNAStructureRecoveryjalview.io.Jalview2xmlTests.testRNAStructureRecovery	1PASS
0.36474165	jalview.io.Jalview2xmlTests.testSaveLoadFeatureColoursAndFiltersjalview.io.Jalview2xmlTests.testSaveLoadFeatureColoursAndFilters	1PASS
0.36474165	jalview.io.JSONFileTest.testGrpParsed_colourNonejalview.io.JSONFileTest.testGrpParsed_colourNone	1PASS
0.3586626	jalview.io.JSONFileTest.testBioJSONRoundTripWithColourSchemeNonejalview.io.JSONFileTest.testBioJSONRoundTripWithColourSchemeNone	1PASS
0.3586626	jalview.gui.AlignFrameTest.testNewView_colourThresholdsjalview.gui.AlignFrameTest.testNewView_colourThresholds	1PASS
0.30395138	jalview.ext.jmol.JmolViewerTest.testAddStrToSingleSeqViewJMoljalview.ext.jmol.JmolViewerTest.testAddStrToSingleSeqViewJMol	1PASS
0.30395138	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFindDistances_withParamsjalview.analysis.scoremodels.FeatureDistanceModelTest.testFindDistances_withParams	1PASS
0.30395138	jalview.io.gff.ExonerateHelperTest.testAddExonerateGffToAlignmentjalview.io.gff.ExonerateHelperTest.testAddExonerateGffToAlignment	1PASS
0.30395138	jalview.gui.AlignViewportTest.testGetConsensusSeqjalview.gui.AlignViewportTest.testGetConsensusSeq	1PASS
0.30091184	jalview.gui.PairwiseAlignmentPanelTest.testConstructor_withSelectionGroupjalview.gui.PairwiseAlignmentPanelTest.testConstructor_withSelectionGroup	1PASS
0.30091184	jalview.io.FeaturesFileTest.testPrintJalviewFormatjalview.io.FeaturesFileTest.testPrintJalviewFormat	1PASS
0.30091184	jalview.gui.SeqCanvasTest.testCalculateWrappedGeometry_withAnnotationsjalview.gui.SeqCanvasTest.testCalculateWrappedGeometry_withAnnotations	1PASS
0.30091184	jalview.io.FeaturesFileTest.testParsejalview.io.FeaturesFileTest.testParse	1PASS
0.30091184	jalview.gui.AlignViewportTest.testSetGlobalColourSchemejalview.gui.AlignViewportTest.testSetGlobalColourScheme	1PASS
0.30091184	jalview.controller.AlignViewControllerTest.testFindColumnsWithFeaturejalview.controller.AlignViewControllerTest.testFindColumnsWithFeature	1PASS
0.30091184	jalview.gui.AlignViewportTest.testSetSelectionGroupjalview.gui.AlignViewportTest.testSetSelectionGroup	1PASS
0.30091184	jalview.gui.SeqCanvasTest.testCalculateWrappedGeometry_fromScrolledjalview.gui.SeqCanvasTest.testCalculateWrappedGeometry_fromScrolled	3FAIL
0.30091184	jalview.io.JalviewExportPropertiesTests.testImportExportPeriodGapsjalview.io.JalviewExportPropertiesTests.testImportExportPeriodGaps	1PASS
0.30091184	jalview.gui.AlignViewportTest.testShowOrDontShowOccupancyjalview.gui.AlignViewportTest.testShowOrDontShowOccupancy	1PASS
0.30091184	jalview.io.FeaturesFileTest.testParse_jalviewFeaturesOnlyjalview.io.FeaturesFileTest.testParse_jalviewFeaturesOnly	1PASS
0.30091184	jalview.gui.SeqCanvasTest.testCalculateWrappedGeometry_noAnnotationsjalview.gui.SeqCanvasTest.testCalculateWrappedGeometry_noAnnotations	1PASS
0.30091184	jalview.io.FeaturesFileTest.testParse_mixedJalviewGffjalview.io.FeaturesFileTest.testParse_mixedJalviewGff	1PASS
0.30091184	jalview.io.Jalview2xmlTests.testStoreAndRecoverPDBEntryjalview.io.Jalview2xmlTests.testStoreAndRecoverPDBEntry	1PASS
0.30091184	jalview.gui.AlignViewportTest.testSetGetHasSearchResultsjalview.gui.AlignViewportTest.testSetGetHasSearchResults	1PASS
0.30091184	jalview.io.FeaturesFileTest.testPrintGffFormatjalview.io.FeaturesFileTest.testPrintGffFormat	1PASS
0.30091184	jalview.schemes.ColourSchemesTest.testRegisterColourSchemejalview.schemes.ColourSchemesTest.testRegisterColourScheme	1PASS
0.30091184	jalview.io.FeaturesFileTest.testParse_pureGff3jalview.io.FeaturesFileTest.testParse_pureGff3	1PASS
0.30091184	jalview.gui.PairwiseAlignmentPanelTest.testConstructor_noSelectionGroupjalview.gui.PairwiseAlignmentPanelTest.testConstructor_noSelectionGroup	1PASS
0.29483283	jalview.io.vcf.VCFLoaderTest.testDoLoad_reverseStrandjalview.io.vcf.VCFLoaderTest.testDoLoad_reverseStrand	1PASS
0.29483283	jalview.io.vcf.VCFLoaderTest.testDoLoad_vepCsqjalview.io.vcf.VCFLoaderTest.testDoLoad_vepCsq	1PASS
0.29483283	jalview.io.vcf.VCFLoaderTest.testDoLoadjalview.io.vcf.VCFLoaderTest.testDoLoad	1PASS
0.29179332	jalview.ext.rbvi.chimera.ChimeraCommandsTest.testGetColourBySequenceCommands_hiddenColumnsjalview.ext.rbvi.chimera.ChimeraCommandsTest.testGetColourBySequenceCommands_hiddenColumns	1PASS
0.29179332	jalview.ext.jmol.JmolCommandsTest.testGetColourBySequenceCommand_noFeaturesjalview.ext.jmol.JmolCommandsTest.testGetColourBySequenceCommand_noFeatures	1PASS
0.29179332	jalview.renderer.seqfeatures.FeatureRendererTest.testFindFeaturesAtColumnjalview.renderer.seqfeatures.FeatureRendererTest.testFindFeaturesAtColumn	1PASS
0.29179332	jalview.ext.jmol.JmolCommandsTest.testGetColourBySequenceCommands_hiddenColumnsjalview.ext.jmol.JmolCommandsTest.testGetColourBySequenceCommands_hiddenColumns	1PASS
0.29179332	jalview.controller.AlignViewControllerTest.testSelectColumnsWithHighlightjalview.controller.AlignViewControllerTest.testSelectColumnsWithHighlight	1PASS
0.29179332	jalview.ext.jmol.JmolViewerTest.testSingleSeqViewJMoljalview.ext.jmol.JmolViewerTest.testSingleSeqViewJMol	1PASS
0.29179332	jalview.schemes.ClustalxColourSchemeTest.testFindColourjalview.schemes.ClustalxColourSchemeTest.testFindColour	1PASS
0.29179332	jalview.io.AnnotatedPDBFileInputTest.testJalviewProjectRelocationAnnotationjalview.io.AnnotatedPDBFileInputTest.testJalviewProjectRelocationAnnotation	1PASS
0.28267476	jalview.gui.SeqPanelTest.testAmbiguousAminoAcidGetsStatusMessagejalview.gui.SeqPanelTest.testAmbiguousAminoAcidGetsStatusMessage	1PASS
0.28267476	jalview.gui.AnnotationChooserTest.testBuildApplyToOptionsPanel_withSelectionGroupjalview.gui.AnnotationChooserTest.testBuildApplyToOptionsPanel_withSelectionGroup	1PASS
0.28267476	jalview.gui.SeqPanelTest.testSetStatusReturnsNearestResiduePositionjalview.gui.SeqPanelTest.testSetStatusReturnsNearestResiduePosition	1PASS
0.28267476	jalview.schemes.PIDColourSchemeTest.testFindColour_ignoreGapsjalview.schemes.PIDColourSchemeTest.testFindColour_ignoreGaps	1PASS
0.27963525	jalview.io.gff.GffTests.testResolveExonerateGffjalview.io.gff.GffTests.testResolveExonerateGff	1PASS
0.27963525	jalview.renderer.seqfeatures.FeatureRendererTest.testFilterFeaturesForDisplayjalview.renderer.seqfeatures.FeatureRendererTest.testFilterFeaturesForDisplay	1PASS
0.27963525	jalview.renderer.seqfeatures.FeatureRendererTest.testGetColourjalview.renderer.seqfeatures.FeatureRendererTest.testGetColour	1PASS
0.27963525	jalview.renderer.seqfeatures.FeatureRendererTest.testFindAllFeaturesjalview.renderer.seqfeatures.FeatureRendererTest.testFindAllFeatures	1PASS
0.27963525	jalview.gui.AlignViewportTest.testDeregisterMapping_withReferencejalview.gui.AlignViewportTest.testDeregisterMapping_withReference	1PASS
0.27963525	jalview.schemes.ColourSchemesTest.testGetColourSchemejalview.schemes.ColourSchemesTest.testGetColourScheme	1PASS
0.27963525	jalview.gui.AlignFrameTest.testHideFeatureColumnsjalview.gui.AlignFrameTest.testHideFeatureColumns	1PASS
0.27963525	jalview.gui.AlignViewportTest.testDeregisterMapping_withNoReferencejalview.gui.AlignViewportTest.testDeregisterMapping_withNoReference	1PASS
0.27963525	jalview.gui.PaintRefresherTest.testGetAssociatedPanelsjalview.gui.PaintRefresherTest.testGetAssociatedPanels	1PASS
0.27963525	jalview.renderer.ScaleRendererTest.testCalculateMarksjalview.renderer.ScaleRendererTest.testCalculateMarks	1PASS
0.27963525	jalview.gui.FeatureSettingsTest.testSaveLoadjalview.gui.FeatureSettingsTest.testSaveLoad	1PASS
0.27963525	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFindDistancesjalview.analysis.scoremodels.FeatureDistanceModelTest.testFindDistances	1PASS
0.27659574	jalview.schemes.ClustalxColourSchemeTest.testFindColour_ignoreGapsjalview.schemes.ClustalxColourSchemeTest.testFindColour_ignoreGaps	1PASS
0.27355623	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModeljalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel	1PASS
0.27355623	jalview.datamodel.AlignmentViewTest.testGetVisibleContigsjalview.datamodel.AlignmentViewTest.testGetVisibleContigs	1PASS
0.27355623	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel_hiddenFirstColumnjalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel_hiddenFirstColumn	1PASS
0.27355623	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel_HiddenColumnsjalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel_HiddenColumns	1PASS
0.2674772	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFindFeatureAt_PointFeaturejalview.analysis.scoremodels.FeatureDistanceModelTest.testFindFeatureAt_PointFeature	1PASS
0.2674772	jalview.gui.AlignViewportTest.testDeregisterMapping_onCloseViewjalview.gui.AlignViewportTest.testDeregisterMapping_onCloseView	1PASS
0.25531915	jalview.gui.AlignViewportTest.testUpdateConservation_qualityOnlyjalview.gui.AlignViewportTest.testUpdateConservation_qualityOnly	1PASS
0.25227964	jalview.analysis.AAFrequencyTest.testCompleteConsensus_ignoreGaps_noLogojalview.analysis.AAFrequencyTest.testCompleteConsensus_ignoreGaps_noLogo	1PASS
0.24012157	jalview.gui.AlignFrameTest.testChangeColour_background_groupsAndThresholdsjalview.gui.AlignFrameTest.testChangeColour_background_groupsAndThresholds	1PASS
0.21884498	jalview.analysis.AAFrequencyTest.testCompleteConsensus_includeGaps_showLogojalview.analysis.AAFrequencyTest.testCompleteConsensus_includeGaps_showLogo	1PASS
0.1762918	jalview.io.AnnotationFileIOTest.exampleAnnotationFileIOjalview.io.AnnotationFileIOTest.exampleAnnotationFileIO	1PASS
0.16413374	jalview.analysis.GroupingTest.testMakeGroupsWithBothjalview.analysis.GroupingTest.testMakeGroupsWithBoth	1PASS
0.10942249	jalview.analysis.AAFrequencyTest.testCalculate_withProfilejalview.analysis.AAFrequencyTest.testCalculate_withProfile	1PASS
0.10638298	jalview.analysis.AAFrequencyTest.testCalculate_noProfilejalview.analysis.AAFrequencyTest.testCalculate_noProfile	1PASS
0.08510638	jalview.structure.StructureSelectionManagerTest.testSetMapping_seqFeaturesjalview.structure.StructureSelectionManagerTest.testSetMapping_seqFeatures	1PASS

Source view

/*
 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
 * Copyright (C) $$Year-Rel$$ The Jalview Authors
 * 
 * This file is part of Jalview.
 * 
 * Jalview is free software: you can redistribute it and/or
 * modify it under the terms of the GNU General Public License 
 * as published by the Free Software Foundation, either version 3
 * of the License, or (at your option) any later version.
 *  
 * Jalview is distributed in the hope that it will be useful, but 
 * WITHOUT ANY WARRANTY; without even the implied warranty 
 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR 
 * PURPOSE.  See the GNU General Public License for more details.
 * 
 * You should have received a copy of the GNU General Public License
 * along with Jalview.  If not, see <http://www.gnu.org/licenses/>.
 * The Jalview Authors are detailed in the 'AUTHORS' file.
 */

package jalview.analysis;

import jalview.datamodel.AlignedCodonFrame;

import jalview.datamodel.AlignmentAnnotation;

import jalview.datamodel.AlignmentI;

import jalview.datamodel.Annotation;

import jalview.datamodel.Profile;

import jalview.datamodel.ProfileI;

import jalview.datamodel.Profiles;

import jalview.datamodel.ProfilesI;

import jalview.datamodel.ResidueCount;

import jalview.datamodel.ResidueCount.SymbolCounts;

import jalview.datamodel.SequenceI;

import jalview.ext.android.SparseIntArray;

import jalview.util.Comparison;

import jalview.util.Format;

import jalview.util.MappingUtils;

import jalview.util.QuickSort;

import java.awt.Color;

import java.util.Arrays;

import java.util.Hashtable;

import java.util.List;

/**
 * Takes in a list or array of sequences and a column start and column end,
 * and computes consensus profile data (returned as a ProfilesI) for each
 * column in that range. This class is used extensively in calculating
 * alignment colourschemes that depend on the amount of conservation in each
 * alignment column.
 * 
 * @author $author$
 * @version $Revision$
 */

public class AAFrequency

{

/**
 * Key under which a column's codon count array is stored in, and read back
 * from, its consensus Hashtable.
 */
public static final String PROFILE = "P";

/*
 * Quick look-up of String value of char 'A' to 'Z'
 */
private static final String[] CHARS = new String['Z' - 'A' + 1];

static
{
  // pre-build the one-character String for each upper case letter
  for (char c = 'A'; c <= 'Z'; c++)
  {
    CHARS[c - 'A'] = String.valueOf(c);
  }
}

/**
 * Calculates consensus profiles for the given column range, without asking
 * for the full symbol counts of each column to be retained. Delegates to the
 * four-argument overload with its 'profile' flag set to false.
 * 
 * @param list
 *          the sequences to profile
 * @param start
 *          start column
 * @param end
 *          end column
 * @return the computed profiles
 */
public static final ProfilesI calculate(List<SequenceI> list, int start,
        int end)
{
  final boolean saveFullProfile = false;
  return calculate(list, start, end, saveFullProfile);
}

473

public static final ProfilesI calculate(List<SequenceI> sequences,

int start, int end, boolean profile)

{

473

SequenceI[] seqs = new SequenceI[sequences.size()];

473

int width = 0;

473

synchronized (sequences)

{

4047

for (int i = 0; i < sequences.size(); i++)

{

3574

seqs[i] = sequences.get(i);

3574

int length = seqs[i].getLength();

3574

if (length > width)

{

483

width = length;

}

473

if (end >= width)

{

281

end = width;

}

473

ProfilesI reply = calculate(seqs, width, start, end, profile);

100

473

return reply;

}

}

/**

* Calculate the consensus symbol(s) for each column in the given range.

* @param sequences

* @param width

* the full width of the alignment

110

* @param start

111

* start column (inclusive, base zero)

112

* @param end

113

* end column (exclusive)

114

* @param saveFullProfile

115

* if true, store all symbol counts

116

117

936

public static final ProfilesI calculate(final SequenceI[] sequences,

118

int width, int start, int end, boolean saveFullProfile)

119

{

120

// long now = System.currentTimeMillis();

121

936

int seqCount = sequences.length;

122

936

boolean nucleotide = false;

123

936

int nucleotideCount = 0;

124

936

int peptideCount = 0;

125

126

936

ProfileI[] result = new ProfileI[width];

127

128

118435

for (int column = start; column < end; column++)

129

{

130

131

* Apply a heuristic to detect nucleotide data (which can

132

* be counted in more compact arrays); here we test for

133

* more than 90% nucleotide; recheck every 10 columns in case

134

* of misleading data e.g. highly conserved Alanine in peptide!

135

* Mistakenly guessing nucleotide has a small performance cost,

136

* as it will result in counting in sparse arrays.

137

* Mistakenly guessing peptide has a small space cost,

138

* as it will use a larger than necessary array to hold counts.

139

140

117502

if (nucleotideCount > 100 && column % 10 == 0)

141

{

142

5708

nucleotide = (9 * peptideCount < nucleotideCount);

143

}

144

117498

ResidueCount residueCounts = new ResidueCount(nucleotide);

145

146

1191097

for (int row = 0; row < seqCount; row++)

147

{

148

1073668

if (sequences[row] == null)

149

{

150

System.err.println(

151

"WARNING: Consensus skipping null sequence - possible race condition.");

152

continue;

153

}

154

1073563

if (sequences[row].getLength() > column)

155

{

156

1061259

char c = sequences[row].getCharAt(column);

157

1061199

residueCounts.add(c);

158

1062601

if (Comparison.isNucleotide(c))

159

{

160

275069

nucleotideCount++;

161

}

162

787723

else if (!Comparison.isGap(c))

163

{

164

659832

peptideCount++;

}

}

else

{

* count a gap if the sequence doesn't reach this column

171

172

12355

residueCounts.addGap();

}

}

117486

int maxCount = residueCounts.getModalCount();

177

117484

String maxResidue = residueCounts.getResiduesForCount(maxCount);

178

117499

int gapCount = residueCounts.getGapCount();

179

117499

ProfileI profile = new Profile(seqCount, gapCount, maxCount,

180

maxResidue);

181

182

117505

if (saveFullProfile)

183

{

184

96615

profile.setCounts(residueCounts);

185

}

186

187

117501

result[column] = profile;

188

}

189

936

return new Profiles(result);

190

// long elapsed = System.currentTimeMillis() - now;

191

// System.out.println(elapsed);

}

/**

* Make an estimate of the profile size we are going to compute i.e. how many

196

* different characters may be present in it. Overestimating has a cost of

197

* using more memory than necessary. Underestimating has a cost of needing to

198

* extend the SparseIntArray holding the profile counts.

199

200

* @param profileSizes

201

* counts of sizes of profiles so far encountered

202

* @return

203

204

static int estimateProfileSize(SparseIntArray profileSizes)

205

{

206

if (profileSizes.size() == 0)

{

return 4;

}

* could do a statistical heuristic here e.g. 75%ile

213

* for now just return the largest value

214

215

return profileSizes.keyAt(profileSizes.size() - 1);

}

/**

* Derive the consensus annotations to be added to the alignment for display.

220

* This does not recompute the raw data, but may be called on a change in

221

* display options, such as 'ignore gaps', which may in turn result in a

222

* change in the derived values.

223

224

* @param consensus

225

* the annotation row to add annotations to

226

* @param profiles

227

* the source consensus data

228

* @param startCol

229

* start column (inclusive)

230

* @param endCol

231

* end column (exclusive)

232

* @param ignoreGaps

233

* if true, normalise residue percentages ignoring gaps

234

* @param showSequenceLogo

235

* if true include all consensus symbols, else just show modal

236

* residue

237

* @param nseq

238

* number of sequences

239

240

665

public static void completeConsensus(AlignmentAnnotation consensus,

241

ProfilesI profiles, int startCol, int endCol, boolean ignoreGaps,

242

boolean showSequenceLogo, long nseq)

243

{

244

// long now = System.currentTimeMillis();

245

665

if (consensus == null || consensus.annotations == null

246

|| consensus.annotations.length < endCol)

247

{

248

249

* called with a bad alignment annotation row

250

* wait for it to be initialised properly

return;

}

96547

for (int i = startCol; i < endCol; i++)

256

{

257

95882

ProfileI profile = profiles.get(i);

258

95884

if (profile == null)

259

{

260

261

* happens if sequences calculated over were

262

* shorter than alignment width

263

264

consensus.annotations[i] = null;

return;

}

95886

final int dp = getPercentageDp(nseq);

269

270

95884

float value = profile.getPercentageIdentity(ignoreGaps);

271

272

95885

String description = getTooltip(profile, value, showSequenceLogo,

273

ignoreGaps, dp);

274

275

95890

String modalResidue = profile.getModalResidue();

276

95890

if ("".equals(modalResidue))

277

{

278

1498

modalResidue = "-";

279

}

280

94393

else if (modalResidue.length() > 1)

281

{

282

6608

modalResidue = "+";

283

}

284

95888

consensus.annotations[i] = new Annotation(modalResidue, description,

285

' ', value);

286

}

287

// long elapsed = System.currentTimeMillis() - now;

288

// System.out.println(-elapsed);

}

/**

* Derive the gap count annotation row.

293

294

* @param gaprow

295

* the annotation row to add annotations to

296

* @param profiles

297

* the source consensus data

298

* @param startCol

299

* start column (inclusive)

300

* @param endCol

301

* end column (exclusive)

302

303

481

public static void completeGapAnnot(AlignmentAnnotation gaprow,

304

ProfilesI profiles, int startCol, int endCol, long nseq)

305

{

306

481

if (gaprow == null || gaprow.annotations == null

307

|| gaprow.annotations.length < endCol)

308

{

309

310

* called with a bad alignment annotation row

311

* wait for it to be initialised properly

return;

}

// always set ranges again

316

481

gaprow.graphMax = nseq;

317

481

gaprow.graphMin = 0;

318

481

double scale = 0.8 / nseq;

319

67795

for (int i = startCol; i < endCol; i++)

320

{

321

67314

ProfileI profile = profiles.get(i);

322

67314

if (profile == null)

323

{

324

325

* happens if sequences calculated over were

326

* shorter than alignment width

327

328

gaprow.annotations[i] = null;

return;

}

67314

final int gapped = profile.getNonGapped();

333

334

67314

String description = "" + gapped;

335

336

67314

gaprow.annotations[i] = new Annotation("", description, '\0', gapped,

337

jalview.util.ColorUtils.bleachColour(Color.DARK_GRAY,

338

(float) scale * gapped));

}

}

/**

* Returns a tooltip showing either

344

* <ul>

345

* <li>the full profile (percentages of all residues present), if

346

* showSequenceLogo is true, or</li>

347

* <li>just the modal (most common) residue(s), if showSequenceLogo is

348

* false</li>

349

* </ul>

350

* Percentages are as a fraction of all sequence, or only ungapped sequences

351

* if ignoreGaps is true.

* @param profile

* @param pid

* @param showSequenceLogo

356

* @param ignoreGaps

357

* @param dp

358

* the number of decimal places to format percentages to

359

* @return

360

361

95884

static String getTooltip(ProfileI profile, float pid,

362

boolean showSequenceLogo, boolean ignoreGaps, int dp)

363

{

364

95884

ResidueCount counts = profile.getCounts();

365

366

95881

String description = null;

367

95892

if (counts != null && showSequenceLogo)

368

{

369

48518

int normaliseBy = ignoreGaps ? profile.getNonGapped()

370

: profile.getHeight();

371

48513

description = counts.getTooltip(normaliseBy, dp);

}

else

{

47380

StringBuilder sb = new StringBuilder(64);

376

47380

String maxRes = profile.getModalResidue();

377

47380

if (maxRes.length() > 1)

378

{

379

2230

sb.append("[").append(maxRes).append("]");

}

else

{

45150

sb.append(maxRes);

384

}

385

47380

if (maxRes.length() > 0)

386

{

387

46783

sb.append(" ");

388

46783

Format.appendPercentage(sb, pid, dp);

389

46783

sb.append("%");

390

}

391

47380

description = sb.toString();

392

}

393

95890

return description;

}

/**

* Returns the sorted profile for the given consensus data. The returned array

* contains

* <pre>

* [profileType, numberOfValues, nonGapCount, charValue1, percentage1, charValue2, percentage2, ...]

402

* in descending order of percentage value

* </pre>

* @param profile

* the data object from which to extract and sort values

407

* @param ignoreGaps

408

* if true, only non-gapped values are included in percentage

* calculations

* @return

48860

public static int[] extractProfile(ProfileI profile, boolean ignoreGaps)

413

{

414

48860

int[] rtnval = new int[64];

415

48860

ResidueCount counts = profile.getCounts();

416

48860

if (counts == null)

{

return null;

}

48860

SymbolCounts symbolCounts = counts.getSymbolCounts();

422

48860

char[] symbols = symbolCounts.symbols;

423

48860

int[] values = symbolCounts.values;

424

48860

QuickSort.sort(values, symbols);

425

48860

int nextArrayPos = 2;

426

48860

int totalPercentage = 0;

427

48860

final int divisor = ignoreGaps ? profile.getNonGapped()

428

: profile.getHeight();

429

430

431

* traverse the arrays in reverse order (highest counts first)

432

433

128760

for (int i = symbols.length - 1; i >= 0; i--)

434

{

435

79900

int theChar = symbols[i];

436

79900

int charCount = values[i];

437

438

79900

rtnval[nextArrayPos++] = theChar;

439

79900

final int percentage = (charCount * 100) / divisor;

440

79900

rtnval[nextArrayPos++] = percentage;

441

79900

totalPercentage += percentage;

442

}

443

48860

rtnval[0] = symbols.length;

444

48860

rtnval[1] = totalPercentage;

445

48860

int[] result = new int[rtnval.length + 1];

446

48860

result[0] = AlignmentAnnotation.SEQUENCE_PROFILE;

447

48860

System.arraycopy(rtnval, 0, result, 1, rtnval.length);

448

449

48860

return result;

}

/**

* Extract a sorted extract of cDNA codon profile data. The returned array

* contains

* <pre>

* [profileType, numberOfValues, totalCount, charValue1, percentage1, charValue2, percentage2, ...]

458

* in descending order of percentage value, where the character values encode codon triplets

* </pre>

* @param hashtable

* @return

public static int[] extractCdnaProfile(Hashtable hashtable,

465

boolean ignoreGaps)

466

{

467

// this holds #seqs, #ungapped, and then codon count, indexed by encoded

468

// codon triplet

469

int[] codonCounts = (int[]) hashtable.get(PROFILE);

470

int[] sortedCounts = new int[codonCounts.length - 2];

471

System.arraycopy(codonCounts, 2, sortedCounts, 0,

472

codonCounts.length - 2);

473

474

int[] result = new int[3 + 2 * sortedCounts.length];

475

// first value is just the type of profile data

476

result[0] = AlignmentAnnotation.CDNA_PROFILE;

477

478

char[] codons = new char[sortedCounts.length];

479

for (int i = 0; i < codons.length; i++)

480

{

481

codons[i] = (char) i;

482

}

483

QuickSort.sort(sortedCounts, codons);

484

int totalPercentage = 0;

485

int distinctValuesCount = 0;

486

int j = 3;

487

int divisor = ignoreGaps ? codonCounts[1] : codonCounts[0];

488

for (int i = codons.length - 1; i >= 0; i--)

489

{

490

final int codonCount = sortedCounts[i];

491

if (codonCount == 0)

492

{

493

break; // nothing else of interest here

494

}

495

distinctValuesCount++;

496

result[j++] = codons[i];

497

final int percentage = codonCount * 100 / divisor;

498

result[j++] = percentage;

499

totalPercentage += percentage;

500

}

501

result[2] = totalPercentage;

502

503

504

* Just return the non-zero values

505

506

// todo next value is redundant if we limit the array to non-zero counts

507

result[1] = distinctValuesCount;

508

return Arrays.copyOfRange(result, 0, j);

}

/**

* Compute a consensus for the cDNA coding for a protein alignment.

513

514

* @param alignment

515

* the protein alignment (which should hold mappings to cDNA

516

* sequences)

517

* @param hconsensus

518

* the consensus data stores to be populated (one per column)

519

520

public static void calculateCdna(AlignmentI alignment,

521

Hashtable[] hconsensus)

522

{

523

final char gapCharacter = alignment.getGapCharacter();

524

List<AlignedCodonFrame> mappings = alignment.getCodonFrames();

525

if (mappings == null || mappings.isEmpty())

{

return;

}

int cols = alignment.getWidth();

531

for (int col = 0; col < cols; col++)

532

{

533

// todo would prefer a Java bean for consensus data

534

Hashtable<String, int[]> columnHash = new Hashtable<String, int[]>();

535

// #seqs, #ungapped seqs, counts indexed by (codon encoded + 1)

536

int[] codonCounts = new int[66];

537

codonCounts[0] = alignment.getSequences().size();

538

int ungappedCount = 0;

539

for (SequenceI seq : alignment.getSequences())

540

{

541

if (seq.getCharAt(col) == gapCharacter)

{

continue;

}

List<char[]> codons = MappingUtils.findCodonsFor(seq, col,

546

mappings);

547

for (char[] codon : codons)

548

{

549

int codonEncoded = CodingUtils.encodeCodon(codon);

550

if (codonEncoded >= 0)

551

{

552

codonCounts[codonEncoded + 2]++;

ungappedCount++;

}

}

}

codonCounts[1] = ungappedCount;

558

// todo: sort values here, save counts and codons?

559

columnHash.put(PROFILE, codonCounts);

560

hconsensus[col] = columnHash;

}

}

/**

* Derive displayable cDNA consensus annotation from computed consensus data.

566

567

* @param consensusAnnotation

568

* the annotation row to be populated for display

569

* @param consensusData

570

* the computed consensus data

571

* @param showProfileLogo

572

* if true show all symbols present at each position, else only the

573

* modal value

574

* @param nseqs

575

* the number of sequences in the alignment

576

577

public static void completeCdnaConsensus(

578

AlignmentAnnotation consensusAnnotation,

579

Hashtable[] consensusData, boolean showProfileLogo, int nseqs)

580

{

581

if (consensusAnnotation == null

582

|| consensusAnnotation.annotations == null

583

|| consensusAnnotation.annotations.length < consensusData.length)

584

{

585

// called with a bad alignment annotation row - wait for it to be

586

// initialised properly

return;

}

// ensure codon triplet scales with font size

591

consensusAnnotation.scaleColLabel = true;

592

for (int col = 0; col < consensusData.length; col++)

593

{

594

Hashtable hci = consensusData[col];

595

if (hci == null)

596

{

597

// gapped protein column?

598

continue;

599

}

600

// array holds #seqs, #ungapped, then codon counts indexed by codon

601

final int[] codonCounts = (int[]) hci.get(PROFILE);

int totalCount = 0;

* First pass - get total count and find the highest

606

607

final char[] codons = new char[codonCounts.length - 2];

608

1690

for (int j = 2; j < codonCounts.length; j++)

609

{

610

1664

final int codonCount = codonCounts[j];

611

1664

codons[j - 2] = (char) (j - 2);

612

1664

totalCount += codonCount;

}

* Sort array of encoded codons by count ascending - so the modal value

617

* goes to the end; start by copying the count (dropping the first value)

618

619

int[] sortedCodonCounts = new int[codonCounts.length - 2];

620

System.arraycopy(codonCounts, 2, sortedCodonCounts, 0,

621

codonCounts.length - 2);

622

QuickSort.sort(sortedCodonCounts, codons);

623

624

int modalCodonEncoded = codons[codons.length - 1];

625

int modalCodonCount = sortedCodonCounts[codons.length - 1];

626

String modalCodon = String

627

.valueOf(CodingUtils.decodeCodon(modalCodonEncoded));

628

if (sortedCodonCounts.length > 1 && sortedCodonCounts[codons.length

629

- 2] == sortedCodonCounts[codons.length - 1])

630

{

631

632

* two or more codons share the modal count

modalCodon = "+";

}

float pid = sortedCodonCounts[sortedCodonCounts.length - 1] * 100

637

/ (float) totalCount;

638

639

640

* todo ? Replace consensus hashtable with sorted arrays of codons and

641

* counts (non-zero only). Include total count in count array [0].

* Scan sorted array backwards for most frequent values first. Show

646

* repeated values compactly.

647

648

StringBuilder mouseOver = new StringBuilder(32);

649

StringBuilder samePercent = new StringBuilder();

650

String percent = null;

651

String lastPercent = null;

652

int percentDecPl = getPercentageDp(nseqs);

653

654

for (int j = codons.length - 1; j >= 0; j--)

655

{

656

int codonCount = sortedCodonCounts[j];

if (codonCount == 0)

{

* remaining codons are 0% - ignore, but finish off the last one if

661

* necessary

662

663

if (samePercent.length() > 0)

664

{

665

mouseOver.append(samePercent).append(": ").append(percent)

.append("% ");

}

break;

}

int codonEncoded = codons[j];

671

final int pct = codonCount * 100 / totalCount;

672

String codon = String

673

.valueOf(CodingUtils.decodeCodon(codonEncoded));

674

StringBuilder sb = new StringBuilder();

675

Format.appendPercentage(sb, pct, percentDecPl);

676

percent = sb.toString();

677

if (showProfileLogo || codonCount == modalCodonCount)

678

{

679

if (percent.equals(lastPercent) && j > 0)

680

{

681

samePercent.append(samePercent.length() == 0 ? "" : ", ");

682

samePercent.append(codon);

}

else

{

if (samePercent.length() > 0)

687

{

688

mouseOver.append(samePercent).append(": ").append(lastPercent)

689

.append("% ");

690

}

691

samePercent.setLength(0);

692

samePercent.append(codon);

693

}

694

lastPercent = percent;

}

}

consensusAnnotation.annotations[col] = new Annotation(modalCodon,

699

mouseOver.toString(), ' ', pid);

}

}

/**

* Returns the number of decimal places to show for profile percentages. For

705

* less than 100 sequences, returns zero (the integer percentage value will be

706

* displayed). For 100-999 sequences, returns 1, for 1000-9999 returns 2, etc.

* @param nseq

* @return

95910

protected static int getPercentageDp(long nseq)

712

{

713

95910

int scale = 0;

714

95910

while (nseq >= 100)

{

scale++;

nseq /= 10;

}

95910

return scale;

720

}

721

}

jalviewX

File AAFrequency.java

Coverage histogram

Code metrics

Classes

Class AAFrequency

Contributing tests

Contributing tests

Source view