File AlignmentUtils.java

Branches:

468

Statements:

928

Methods:

Classes:

LOC:

3,283

NCLOC:

1,991

Total complexity:

358

Complexity density:

0.39

Statements/Method:

15.47

Methods/Class:

Average method complexity:

5.97

Classes

Class	Line #	Total Statements	Complexity	TOTAL Coverage	Actions
AlignmentUtils	80	922	352	0.819694982%
AlignmentUtils.DnaVariant	96	6	6	0.00%

Class AlignmentUtils

Class AlignmentUtils	Line # 80	Total Statements 922	Complexity 352	TOTAL Coverage 0.819694982%
expandContext(AlignmentI,int) : AlignmentI expandContext(AlignmentI,int) : AlignmentI	137137	46.046	10.010	0.983871 0.98387198.4%
getSequenceIndex(AlignmentI,SequenceI) : int getSequenceIndex(AlignmentI,SequenceI) : int	243243	8.08	2.02	1.0 1.0100%
getSequencesByName(AlignmentI) : Map<String, List<SequenceI>> getSequencesByName(AlignmentI) : Map<String, List<SequenceI>>	266266	10.010	3.03	0.9285714 0.928571492.9%
mapProteinAlignmentToCdna(AlignmentI,AlignmentI) : boolean mapProteinAlignmentToCdna(AlignmentI,AlignmentI) : boolean	297297	7.07	3.03	0.7777778 0.777777877.8%
mapProteinToCdna(AlignmentI,AlignmentI,Set<SequenceI>,Set<SequenceI>,boolean) : boolean mapProteinToCdna(AlignmentI,AlignmentI,Set<SequenceI>,Set<SequenceI>,boolean) : boolean	339339	22.022	9.09	0.9375 0.937593.8%
mappingExists(List<AlignedCodonFrame>,SequenceI,SequenceI) : boolean mappingExists(List<AlignedCodonFrame>,SequenceI,SequenceI) : boolean	406406	5.05	3.03	0.6666667 0.666666766.7%
mapCdnaToProtein(SequenceI,SequenceI) : MapList mapCdnaToProtein(SequenceI,SequenceI) : MapList	439439	28.028	12.012	0.95238096 0.9523809695.2%
translatesAs(char[],int,char[]) : boolean translatesAs(char[],int,char[]) : boolean	529529	21.021	14.014	1.0 1.0100%
alignSequenceAs(SequenceI,AlignmentI,String,boolean,boolean) : boolean alignSequenceAs(SequenceI,AlignmentI,String,boolean,boolean) : boolean	606606	14.014	5.05	0.9 0.990%
alignSequenceAs(SequenceI,SequenceI,AlignedCodonFrame,String,char,boolean,boolean) : void alignSequenceAs(SequenceI,SequenceI,AlignedCodonFrame,String,char,boolean,boolean) : void	662662	60.060	20.020	1.0 1.0100%
calculateGapsToInsert(boolean,boolean,int,boolean,int,int,boolean) : int calculateGapsToInsert(boolean,boolean,int,boolean,int,int,boolean) : int	827827	15.015	10.010	1.0 1.0100%
alignProteinAsDna(AlignmentI,AlignmentI) : int alignProteinAsDna(AlignmentI,AlignmentI) : int	891891	6.06	3.03	0.625 0.62562.5%
alignCdsAsProtein(AlignmentI,AlignmentI) : int alignCdsAsProtein(AlignmentI,AlignmentI) : int	917917	18.018	5.05	0.8333333 0.833333383.3%
alignCdsSequenceAsProtein(SequenceI,AlignmentI,List<AlignedCodonFrame>,char) : boolean alignCdsSequenceAsProtein(SequenceI,AlignmentI,List<AlignedCodonFrame>,char) : boolean	963963	48.048	16.016	0.67105263 0.6710526367.1%
buildCodonColumnsMap(AlignmentI,AlignmentI,List<SequenceI>) : Map<AlignedCodon, Map<SequenceI, AlignedCodon>> buildCodonColumnsMap(AlignmentI,AlignmentI,List<SequenceI>) : Map<AlignedCodon, Map<SequenceI, AlignedCodon>>	10941094	13.013	2.02	1.0 1.0100%
addUnmappedPeptideStarts(Map<AlignedCodon, Map<SequenceI, AlignedCodon>>,int) : void addUnmappedPeptideStarts(Map<AlignedCodon, Map<SequenceI, AlignedCodon>>,int) : void	11501150	23.023	6.06	0.93939394 0.9393939493.9%
alignProteinAs(AlignmentI,Map<AlignedCodon, Map<SequenceI, AlignedCodon>>,List<SequenceI>) : int alignProteinAs(AlignmentI,Map<AlignedCodon, Map<SequenceI, AlignedCodon>>,List<SequenceI>) : int	12331233	17.017	2.02	1.0 1.0100%
addCodonPositions(SequenceI,SequenceI,char,Mapping,Map<AlignedCodon, Map<SequenceI, AlignedCodon>>) : void addCodonPositions(SequenceI,SequenceI,char,Mapping,Map<AlignedCodon, Map<SequenceI, AlignedCodon>>) : void	12981298	5.05	4.04	1.0 1.0100%
addCodonToMap(Map<AlignedCodon, Map<SequenceI, AlignedCodon>>,AlignedCodon,SequenceI) : void addCodonToMap(Map<AlignedCodon, Map<SequenceI, AlignedCodon>>,AlignedCodon,SequenceI) : void	13311331	5.05	2.02	1.0 1.0100%
isMappable(AlignmentI,AlignmentI) : boolean isMappable(AlignmentI,AlignmentI) : boolean	13611361	12.012	7.07	1.0 1.0100%
isMappable(SequenceI,SequenceI,List<AlignedCodonFrame>) : boolean isMappable(SequenceI,SequenceI,List<AlignedCodonFrame>) : boolean	14001400	8.08	6.06	0.625 0.62562.5%
findAddableReferenceAnnotations(List<SequenceI>,Map<String, String>,Map<SequenceI, List<AlignmentAnnotation>>,AlignmentI) : void findAddableReferenceAnnotations(List<SequenceI>,Map<String, String>,Map<SequenceI, List<AlignmentAnnotation>>,AlignmentI) : void	14471447	24.024	9.09	0.95 0.9595%
addReferenceAnnotations(Map<SequenceI, List<AlignmentAnnotation>>,AlignmentI,SequenceGroup) : void addReferenceAnnotations(Map<SequenceI, List<AlignmentAnnotation>>,AlignmentI,SequenceGroup) : void	15301530	3.03	1.01	1.0 1.0100%
isSSAnnotationPresent(Map<SequenceI, List<AlignmentAnnotation>>) : boolean isSSAnnotationPresent(Map<SequenceI, List<AlignmentAnnotation>>) : boolean	15431543	4.04	2.02	0.0 0.00%
addReferenceAnnotationTo(AlignmentI,SequenceI,AlignmentAnnotation,SequenceGroup) : AlignmentAnnotation addReferenceAnnotationTo(AlignmentI,SequenceI,AlignmentAnnotation,SequenceGroup) : AlignmentAnnotation	15721572	16.016	4.04	0.95454544 0.9545454495.5%
showOrHideSequenceAnnotations(AlignmentI,Collection<String>,List<SequenceI>,boolean,boolean) : void showOrHideSequenceAnnotations(AlignmentI,Collection<String>,List<SequenceI>,boolean,boolean) : void	16271627	6.06	7.07	0.9166667 0.916666791.7%
showOrHideAutoCalculatedAnnotationsForGroup(AlignmentI,String,SequenceGroup,boolean,boolean) : void showOrHideAutoCalculatedAnnotationsForGroup(AlignmentI,String,SequenceGroup,boolean,boolean) : void	16641664	6.06	7.07	0.0 0.00%
getFirstSequenceAnnotationOfType(AlignmentI,int) : AlignmentAnnotation getFirstSequenceAnnotationOfType(AlignmentI,int) : AlignmentAnnotation	16921692	6.06	4.04	0.0 0.00%
haveCrossRef(SequenceI,SequenceI) : boolean haveCrossRef(SequenceI,SequenceI) : boolean	17141714	1.01	1.01	1.0 1.0100%
hasCrossRef(SequenceI,SequenceI) : boolean hasCrossRef(SequenceI,SequenceI) : boolean	17291729	11.011	6.06	1.0 1.0100%
makeCdsAlignment(SequenceI[],AlignmentI,SequenceI[]) : AlignmentI makeCdsAlignment(SequenceI[],AlignmentI,SequenceI[]) : AlignmentI	17701770	66.066	16.016	0.8913044 0.891304489.1%
transferGeneLoci(SequenceI,MapList,SequenceI) : void transferGeneLoci(SequenceI,MapList,SequenceI) : void	19971997	8.08	4.04	0.9285714 0.928571492.9%
findCdsForProtein(List<AlignedCodonFrame>,SequenceI,List<AlignedCodonFrame>,Mapping) : SequenceI findCdsForProtein(List<AlignedCodonFrame>,SequenceI,List<AlignedCodonFrame>,Mapping) : SequenceI	20352035	19.019	11.011	0.9354839 0.935483993.5%
makeCdsSequence(SequenceI,Mapping,AlignmentI) : SequenceI makeCdsSequence(SequenceI,Mapping,AlignmentI) : SequenceI	21222122	32.032	10.010	0.62 0.6262%
propagateDBRefsToCDS(SequenceI,SequenceI,SequenceI,Mapping) : List<DBRefEntry> propagateDBRefsToCDS(SequenceI,SequenceI,SequenceI,Mapping) : List<DBRefEntry>	22152215	28.028	11.011	0.8863636 0.886363688.6%
transferFeatures(SequenceI,SequenceI,MapList,String,String) : int transferFeatures(SequenceI,SequenceI,MapList,String,String) : int	23032303	33.033	12.012	0.8867925 0.886792588.7%
mapCdsToProtein(SequenceI,SequenceI) : MapList mapCdsToProtein(SequenceI,SequenceI) : MapList	23992399	22.022	5.05	1.0 1.0100%
findCdsPositions(SequenceI) : List<int[]> findCdsPositions(SequenceI) : List<int[]>	24622462	20.020	7.07	0.9285714 0.928571492.9%
makeCopyAlignment(SequenceI[],SequenceI[],AlignmentI) : AlignmentI makeCopyAlignment(SequenceI[],SequenceI[],AlignmentI) : AlignmentI	25302530	21.021	9.09	0.0 0.00%
alignAs(AlignmentI,AlignmentI) : int alignAs(AlignmentI,AlignmentI) : int	25852585	26.026	5.05	0.88235295 0.8823529588.2%
alignAsSameSequences(AlignmentI,AlignmentI) : boolean alignAsSameSequences(AlignmentI,AlignmentI) : boolean	26642664	33.033	7.07	0.88372093 0.8837209388.4%
buildMappedColumnsMap(AlignmentI,AlignmentI,List<SequenceI>) : SortedMap<Integer, Map<SequenceI, Character>> buildMappedColumnsMap(AlignmentI,AlignmentI,List<SequenceI>) : SortedMap<Integer, Map<SequenceI, Character>>	27582758	11.011	3.03	0.93333334 0.9333333493.3%
addMappedPositions(SequenceI,SequenceI,Mapping,Map<Integer, Map<SequenceI, Character>>) : boolean addMappedPositions(SequenceI,SequenceI,Mapping,Map<Integer, Map<SequenceI, Character>>) : boolean	28122812	24.024	11.011	0.8 0.880%
looksLikeEnsembl(AlignmentI) : boolean looksLikeEnsembl(AlignmentI) : boolean	28872887	5.05	3.03	0.71428573 0.7142857371.4%
isSecondaryStructurePresent(AlignmentAnnotation[]) : boolean isSecondaryStructurePresent(AlignmentAnnotation[]) : boolean	29002900	8.08	3.03	0.8333333 0.833333383.3%
getSecondaryStructureAnnotationColour(char) : Color getSecondaryStructureAnnotationColour(char) : Color	29232923	7.07	4.04	0.0 0.00%
findSSAnnotationForGivenSeqposition(AlignmentAnnotation,int) : char findSSAnnotationForGivenSeqposition(AlignmentAnnotation,int) : char	29422942	9.09	5.05	0.93333334 0.9333333493.3%
extractSSSourceInAlignmentAnnotation(AlignmentAnnotation[]) : List<String> extractSSSourceInAlignmentAnnotation(AlignmentAnnotation[]) : List<String>	29692969	11.011	4.04	1.0 1.0100%
extractSSSourceFromAnnotationDescription(AlignmentAnnotation) : String extractSSSourceFromAnnotationDescription(AlignmentAnnotation) : String	30003000	26.026	15.015	0.76086956 0.7608695676.1%
getAlignmentAnnotationForSource(SequenceI,String) : List<AlignmentAnnotation> getAlignmentAnnotationForSource(SequenceI,String) : List<AlignmentAnnotation>	31023102	14.014	6.06	0.95454544 0.9545454495.5%
getSequenceAssociatedAlignmentAnnotations(AlignmentAnnotation[],String) : Map<SequenceI, ArrayList<AlignmentAnnotation>> getSequenceAssociatedAlignmentAnnotations(AlignmentAnnotation[],String) : Map<SequenceI, ArrayList<AlignmentAnnotation>>	31413141	9.09	5.05	0.53333336 0.5333333653.3%
isSecondaryStructureFrom(String,AlignmentAnnotation) : boolean isSecondaryStructureFrom(String,AlignmentAnnotation) : boolean	31783178	8.08	5.05	0.0 0.00%
getSecondaryStructureProviderKey(String) : String getSecondaryStructureProviderKey(String) : String	32043204	4.04	2.02	0.0 0.00%
reduceLabelLength(String) : String reduceLabelLength(String) : String	32193219	3.03	1.01	0.0 0.00%
getSecondaryStructureProviderColor(String) : Color getSecondaryStructureProviderColor(String) : Color	32423242	4.04	2.02	0.0 0.00%
assignSecondaryStructureProviderColor(Map<String, Color>,List<String>) : void assignSecondaryStructureProviderColor(Map<String, Color>,List<String>) : void	32533253	3.03	1.01	0.0 0.00%

Class AlignmentUtils.DnaVariant

Class AlignmentUtils.DnaVariant	Line # 96	Total Statements 6	Complexity 6	TOTAL Coverage 0.00%
DnaVariant(String) DnaVariant(String)	102102	2.02	1.01	0.0 0.00%
DnaVariant(String,SequenceFeature) DnaVariant(String,SequenceFeature)	108108	2.02	1.01	0.0 0.00%
getSource() : String getSource() : String	114114	1.01	2.02	0.0 0.00%
toString() : String toString() : String	122122	1.01	2.02	0.0 0.00%

Contributing tests

This file is covered by 286 tests. .

Contributing tests

Test contribution	Test	Result
0.29464287	jalview.io.CrossRef2xmlTests.openCrossrefsForEnsemblTwicejalview.io.CrossRef2xmlTests.openCrossrefsForEnsemblTwice	1PASS
0.12637363	jalview.analysis.AlignmentUtilsTests.testMakeCdsAlignmentjalview.analysis.AlignmentUtilsTests.testMakeCdsAlignment	1PASS
0.10233516	jalview.bin.CommandsTest.structureImageOutputTestjalview.bin.CommandsTest.structureImageOutputTest	1PASS
0.10233516	jalview.bin.CommandsTest.structureImageOutputTestjalview.bin.CommandsTest.structureImageOutputTest	1PASS
0.100961536	jalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_withXrefsjalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_withXrefs	1PASS
0.100961536	jalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_withStartAndStopCodonsjalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_withStartAndStopCodons	1PASS
0.0989011	jalview.bin.CommandsTest2.structureOpeningArgsTestjalview.bin.CommandsTest2.structureOpeningArgsTest	1PASS
0.097527474	jalview.bin.CommandsTest2.structureOpeningArgsTestjalview.bin.CommandsTest2.structureOpeningArgsTest	1PASS
0.097527474	jalview.bin.CommandsTest2.structureOpeningArgsTestjalview.bin.CommandsTest2.structureOpeningArgsTest	1PASS
0.094093405	jalview.bin.CommandsTest.structureImageAnnotationsOutputTestjalview.bin.CommandsTest.structureImageAnnotationsOutputTest	1PASS
0.094093405	jalview.bin.CommandsTest.structureImageAnnotationsOutputTestjalview.bin.CommandsTest.structureImageAnnotationsOutputTest	1PASS
0.094093405	jalview.bin.CommandsTest.structureImageAnnotationsOutputTestjalview.bin.CommandsTest.structureImageAnnotationsOutputTest	1PASS
0.094093405	jalview.bin.CommandsTest.structureImageAnnotationsOutputTestjalview.bin.CommandsTest.structureImageAnnotationsOutputTest	1PASS
0.094093405	jalview.bin.CommandsTest2.structureOpeningArgsTestjalview.bin.CommandsTest2.structureOpeningArgsTest	1PASS
0.094093405	jalview.bin.CommandsTest2.structureOpeningArgsTestjalview.bin.CommandsTest2.structureOpeningArgsTest	1PASS
0.09065934	jalview.analysis.AlignmentUtilsTests.testMakeCdsAlignment_multipleProteinsjalview.analysis.AlignmentUtilsTests.testMakeCdsAlignment_multipleProteins	1PASS
0.09134615	jalview.bin.CommandsTest.structureImageOutputTestjalview.bin.CommandsTest.structureImageOutputTest	1PASS
0.09134615	jalview.bin.CommandsTest.structureImageOutputTestjalview.bin.CommandsTest.structureImageOutputTest	1PASS
0.089972526	jalview.analysis.AlignmentUtilsTests.testMakeCdsAlignment_filterProductsjalview.analysis.AlignmentUtilsTests.testMakeCdsAlignment_filterProducts	1PASS
0.08791209	jalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_noXrefsjalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_noXrefs	1PASS
0.08585165	jalview.analysis.AlignmentUtilsTests.testMakeCdsAlignment_alternativeTranscriptsjalview.analysis.AlignmentUtilsTests.testMakeCdsAlignment_alternativeTranscripts	1PASS
0.08379121	jalview.io.FeaturesFileTest.simpleGff3FileLoaderjalview.io.FeaturesFileTest.simpleGff3FileLoader	1PASS
0.08035714	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.08035714	jalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTestjalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTest	1PASS
0.08035714	jalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTestjalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTest	1PASS
0.08035714	jalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTestjalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTest	1PASS
0.078983516	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.07486264	jalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_prioritiseXrefsjalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_prioritiseXrefs	1PASS
0.07348901	jalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withMapping_withIntronsjalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withMapping_withIntrons	1PASS
0.07074176	jalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withMapping_noIntronsjalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withMapping_noIntrons	1PASS
0.06662088	jalview.io.FeaturesFileTest.simpleGff3RelaxedIdMatchingjalview.io.FeaturesFileTest.simpleGff3RelaxedIdMatching	1PASS
0.06662088	jalview.io.FeaturesFileTest.readGff3Filejalview.io.FeaturesFileTest.readGff3File	1PASS
0.06662088	jalview.io.FeaturesFileTest.simpleGff3FileClassjalview.io.FeaturesFileTest.simpleGff3FileClass	1PASS
0.06387363	jalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_keepIntronGapsOnlyjalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_keepIntronGapsOnly	1PASS
0.06456044	jalview.datamodel.AlignmentTest.testAlignAs_dnaAsDnajalview.datamodel.AlignmentTest.testAlignAs_dnaAsDna	1PASS
0.06318682	jalview.analysis.AlignmentUtilsTests.testAlignAs_alternateTranscriptsUngappedjalview.analysis.AlignmentUtilsTests.testAlignAs_alternateTranscriptsUngapped	1PASS
0.06387363	jalview.ext.jmol.JmolViewerTest.testAddStrToSingleSeqViewJMoljalview.ext.jmol.JmolViewerTest.testAddStrToSingleSeqViewJMol	1PASS
0.061126374	jalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withMapping_withUnmappedProteinjalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withMapping_withUnmappedProtein	1PASS
0.059752747	jalview.project.Jalview2xmlTests.testStoreAndRecoverPDBEntryjalview.project.Jalview2xmlTests.testStoreAndRecoverPDBEntry	1PASS
0.059752747	jalview.io.AnnotatedPDBFileInputTest.testJalviewProjectRelocationAnnotationjalview.io.AnnotatedPDBFileInputTest.testJalviewProjectRelocationAnnotation	1PASS
0.059752747	jalview.ext.jmol.JmolViewerTest.testSingleSeqViewJMoljalview.ext.jmol.JmolViewerTest.testSingleSeqViewJMol	1PASS
0.059752747	jalview.ext.jmol.JmolParserTest.testAlignmentLoaderjalview.ext.jmol.JmolParserTest.testAlignmentLoader	1PASS
0.06043956	jalview.analysis.AlignmentUtilsTests.testAlignProteinAsDna_incompleteStartCodonjalview.analysis.AlignmentUtilsTests.testAlignProteinAsDna_incompleteStartCodon	1PASS
0.057692308	jalview.gui.StructureChooserTest.openStructureFileForSequenceTestjalview.gui.StructureChooserTest.openStructureFileForSequenceTest	1PASS
0.057692308	jalview.gui.StructureChooserTest.openStructureFileForSequenceTestjalview.gui.StructureChooserTest.openStructureFileForSequenceTest	1PASS
0.057692308	jalview.gui.StructureChooserTest.openStructureFileForSequenceTestjalview.gui.StructureChooserTest.openStructureFileForSequenceTest	1PASS
0.057005495	jalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withTrailingPeptidejalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withTrailingPeptide	1PASS
0.057692308	jalview.gui.StructureChooserTest.openStructureFileForSequenceTestjalview.gui.StructureChooserTest.openStructureFileForSequenceTest	1PASS
0.05631868	jalview.gui.AnnotationLabelsTest2.testIdWidthNoChangesjalview.gui.AnnotationLabelsTest2.testIdWidthNoChanges	1PASS
0.05631868	jalview.gui.AnnotationLabelsTest2.testIdWidthNoChangesjalview.gui.AnnotationLabelsTest2.testIdWidthNoChanges	1PASS
0.05631868	jalview.gui.AnnotationLabelsTest2.testIdWidthChangesjalview.gui.AnnotationLabelsTest2.testIdWidthChanges	1PASS
0.05631868	jalview.gui.AnnotationLabelsTest2.testIdWidthChangesjalview.gui.AnnotationLabelsTest2.testIdWidthChanges	1PASS
0.054945055	jalview.analysis.AlignmentUtilsTests.testAlignProteinAsDnajalview.analysis.AlignmentUtilsTests.testAlignProteinAsDna	1PASS
0.054258242	jalview.datamodel.AlignmentTest.testAlignAs_proteinAsCdnajalview.datamodel.AlignmentTest.testAlignAs_proteinAsCdna	1PASS
0.052197803	jalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_mappedProteinProteinjalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_mappedProteinProtein	1PASS
0.050137363	jalview.datamodel.AlignmentTest.testAlignAs_cdnaAsProteinjalview.datamodel.AlignmentTest.testAlignAs_cdnaAsProtein	1PASS
0.050824177	jalview.analysis.AlignmentUtilsTests.testIsMappablejalview.analysis.AlignmentUtilsTests.testIsMappable	1PASS
0.048763737	jalview.datamodel.AlignmentTest.testAlignAs_cdnaAsProtein_singleSequencejalview.datamodel.AlignmentTest.testAlignAs_cdnaAsProtein_singleSequence	1PASS
0.048763737	jalview.project.Jalview2xmlTests.testRNAStructureRecoveryjalview.project.Jalview2xmlTests.testRNAStructureRecovery	1PASS
0.039835166	jalview.analysis.AlignmentUtilsTests.testExpandContextjalview.analysis.AlignmentUtilsTests.testExpandContext	1PASS
0.037087914	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withSSUndefinedInEitherOneSeqjalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withSSUndefinedInEitherOneSeq	1PASS
0.037774727	jalview.io.AnnotatedPDBFileInputTest.checkNoDuplicatesjalview.io.AnnotatedPDBFileInputTest.checkNoDuplicates	1PASS
0.03846154	jalview.analysis.AlignmentUtilsTests.testMapCdsToProteinjalview.analysis.AlignmentUtilsTests.testMapCdsToProtein	1PASS
0.037087914	jalview.project.Jalview2xmlTests.testPAEsaveRestorejalview.project.Jalview2xmlTests.testPAEsaveRestore	1PASS
0.037774727	jalview.analysis.AlignmentUtilsTests.testAddReferenceContactMapjalview.analysis.AlignmentUtilsTests.testAddReferenceContactMap	1PASS
0.035714287	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withGapjalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withGap	1PASS
0.033653848	jalview.analysis.AlignmentUtilsTests.testAddReferenceAnnotationsjalview.analysis.AlignmentUtilsTests.testAddReferenceAnnotations	1PASS
0.03228022	jalview.analysis.AlignmentUtilsTests.testExpandContext_annotationjalview.analysis.AlignmentUtilsTests.testExpandContext_annotation	1PASS
0.03021978	jalview.analysis.AlignmentUtilsTests.testMapCdnaToProtein_forSubsequencejalview.analysis.AlignmentUtilsTests.testMapCdnaToProtein_forSubsequence	1PASS
0.026098901	jalview.analysis.AlignmentUtilsTests.testAlignAsSameSequencesjalview.analysis.AlignmentUtilsTests.testAlignAsSameSequences	1PASS
0.026098901	jalview.analysis.AlignmentUtilsTests.testTranslatesAsjalview.analysis.AlignmentUtilsTests.testTranslatesAs	1PASS
0.026785715	jalview.analysis.AlignmentUtilsTests.testTransferFeaturesjalview.analysis.AlignmentUtilsTests.testTransferFeatures	1PASS
0.025412088	jalview.analysis.AlignmentUtilsTests.testAlignAsSameSequencesMultipleSubSeqjalview.analysis.AlignmentUtilsTests.testAlignAsSameSequencesMultipleSubSeq	1PASS
0.024038462	jalview.project.Jalview2xmlTests.testAutoShowOverviewForLegacyProjectsjalview.project.Jalview2xmlTests.testAutoShowOverviewForLegacyProjects	1PASS
0.024725275	jalview.analysis.AlignmentUtilsTests.testTransferFeatures_withOmitjalview.analysis.AlignmentUtilsTests.testTransferFeatures_withOmit	1PASS
0.023351649	jalview.gui.AlignViewportTest.testGetSelectionAsNewSequences_withContactMatricesjalview.gui.AlignViewportTest.testGetSelectionAsNewSequences_withContactMatrices	1PASS
0.023351649	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withSSUndefinedInBothSeqsjalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withSSUndefinedInBothSeqs	1PASS
0.024038462	jalview.project.Jalview2xmlTests.gatherViewsHerejalview.project.Jalview2xmlTests.gatherViewsHere	1PASS
0.024725275	jalview.project.Jalview2xmlTests.testStoreAndRecoverColourThresholdsjalview.project.Jalview2xmlTests.testStoreAndRecoverColourThresholds	1PASS
0.024038462	jalview.project.Jalview2xmlTests.testStoreAndRecoverReferenceSeqSettingsjalview.project.Jalview2xmlTests.testStoreAndRecoverReferenceSeqSettings	1PASS
0.024725275	jalview.project.Jalview2xmlTests.testTCoffeeScoresjalview.project.Jalview2xmlTests.testTCoffeeScores	1PASS
0.024725275	jalview.gui.AlignFrameTest.testNewView_colourThresholdsjalview.gui.AlignFrameTest.testNewView_colourThresholds	1PASS
0.024725275	jalview.gui.ColourMenuHelperTest.testAddMenuItems_nucleotidejalview.gui.ColourMenuHelperTest.testAddMenuItems_nucleotide	1PASS
0.024038462	jalview.io.JSONFileTest.testBioJSONRoundTripWithColourSchemeNonejalview.io.JSONFileTest.testBioJSONRoundTripWithColourSchemeNone	1PASS
0.024038462	jalview.project.Jalview2xmlTests.testStoreAndRecoverExpandedviewsjalview.project.Jalview2xmlTests.testStoreAndRecoverExpandedviews	1PASS
0.024038462	jalview.project.Jalview2xmlTests.noDuplicatePdbMappingsMadejalview.project.Jalview2xmlTests.noDuplicatePdbMappingsMade	1PASS
0.024038462	jalview.project.Jalview2xmlTests.testCopyViewSettingsjalview.project.Jalview2xmlTests.testCopyViewSettings	1PASS
0.024038462	jalview.project.Jalview2xmlTests.testStoreAndRestoreIDwidthAndAnnotationHeightjalview.project.Jalview2xmlTests.testStoreAndRestoreIDwidthAndAnnotationHeight	1PASS
0.024725275	jalview.project.Jalview2xmlTests.testColourByAnnotScoresjalview.project.Jalview2xmlTests.testColourByAnnotScores	1PASS
0.023351649	jalview.project.Jalview2xmlTests.testStoreAndRecoverAnnotationRowElementColoursjalview.project.Jalview2xmlTests.testStoreAndRecoverAnnotationRowElementColours	1PASS
0.024038462	jalview.project.Jalview2xmlTests.viewRefPdbAnnotationjalview.project.Jalview2xmlTests.viewRefPdbAnnotation	1PASS
0.02129121	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.021978023	jalview.analysis.AlignmentUtilsTests.testAddMappedPositions_withStopCodonjalview.analysis.AlignmentUtilsTests.testAddMappedPositions_withStopCodon	1PASS
0.021978023	jalview.analysis.AlignmentUtilsTests.testAddMappedPositionsjalview.analysis.AlignmentUtilsTests.testAddMappedPositions	1PASS
0.020604396	jalview.analysis.AlignmentUtilsTests.testTransferFeatures_withSelectjalview.analysis.AlignmentUtilsTests.testTransferFeatures_withSelect	1PASS
0.02129121	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.02129121	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.01923077	jalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_notOnAlignmentjalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_notOnAlignment	1PASS
0.01923077	jalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenujalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu	1PASS
0.019917583	jalview.analysis.AlignmentUtilsTests.testFindCdsForProtein_noUTRjalview.analysis.AlignmentUtilsTests.testFindCdsForProtein_noUTR	1PASS
0.018543957	jalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_alreadyAddedjalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_alreadyAdded	1PASS
0.018543957	jalview.io.AnnotationFileIOTest.exampleAnnotationFileIOjalview.io.AnnotationFileIOTest.exampleAnnotationFileIO	1PASS
0.01717033	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.01717033	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.01717033	jalview.io.vcf.VCFLoaderTest.testDoLoad_reverseStrandjalview.io.vcf.VCFLoaderTest.testDoLoad_reverseStrand	1PASS
0.01717033	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.01717033	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01717033	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFindDistances_withParamsjalview.analysis.scoremodels.FeatureDistanceModelTest.testFindDistances_withParams	1PASS
0.01717033	jalview.gui.SeqPanelTest.testFindColumn_and_FindAlignmentColumn_wrappedjalview.gui.SeqPanelTest.testFindColumn_and_FindAlignmentColumn_wrapped	1PASS
0.01717033	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01717033	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01717033	jalview.gui.SeqPanelTest.testFindColumn_unwrappedjalview.gui.SeqPanelTest.testFindColumn_unwrapped	1PASS
0.01717033	jalview.analysis.AverageDistanceEngineTest.testUPGMAEnginejalview.analysis.AverageDistanceEngineTest.testUPGMAEngine	1PASS
0.01717033	jalview.renderer.seqfeatures.FeatureRendererTest.testFindComplementFeaturesAtResiduejalview.renderer.seqfeatures.FeatureRendererTest.testFindComplementFeaturesAtResidue	1PASS
0.01717033	jalview.io.AnnotationFileIOTest.testAnnotateAlignmentViewjalview.io.AnnotationFileIOTest.testAnnotateAlignmentView	1PASS
0.01717033	jalview.project.Jalview2xmlTests.testSaveLoadFeatureColoursAndFiltersjalview.project.Jalview2xmlTests.testSaveLoadFeatureColoursAndFilters	1PASS
0.01717033	jalview.gui.QuitHandlerTest.testUnsavedChangesjalview.gui.QuitHandlerTest.testUnsavedChanges	1PASS
0.01717033	jalview.bin.CommandsTest2.structureOpeningArgsTestjalview.bin.CommandsTest2.structureOpeningArgsTest	1PASS
0.01717033	jalview.io.vcf.VCFLoaderTest.testDoLoadjalview.io.vcf.VCFLoaderTest.testDoLoad	1PASS
0.01717033	jalview.datamodel.AlignmentViewTest.testGetVisibleContigsjalview.datamodel.AlignmentViewTest.testGetVisibleContigs	1PASS
0.01717033	jalview.schemes.ClustalxColourSchemeTest.testFindColourjalview.schemes.ClustalxColourSchemeTest.testFindColour	1PASS
0.01717033	jalview.gui.AlignViewportTest.testSetGetHasSearchResultsjalview.gui.AlignViewportTest.testSetGetHasSearchResults	1PASS
0.01717033	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01717033	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel_hiddenFirstColumnjalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel_hiddenFirstColumn	1PASS
0.01717033	jalview.renderer.seqfeatures.FeatureRendererTest.testFindFeaturesAtColumnjalview.renderer.seqfeatures.FeatureRendererTest.testFindFeaturesAtColumn	1PASS
0.01717033	jalview.io.BackupFilesTest.backupsEnabledRollMaxTestjalview.io.BackupFilesTest.backupsEnabledRollMaxTest	1PASS
0.01717033	jalview.io.JalviewExportPropertiesTests.testImportExportPeriodGapsjalview.io.JalviewExportPropertiesTests.testImportExportPeriodGaps	1PASS
0.01717033	jalview.project.Jalview2xmlTests.testStoreAndRecoverGroupRepSeqsjalview.project.Jalview2xmlTests.testStoreAndRecoverGroupRepSeqs	1PASS
0.01717033	jalview.gui.QuitHandlerTest.testWaitForSaveQuitjalview.gui.QuitHandlerTest.testWaitForSaveQuit	1PASS
0.01717033	jalview.io.JSONFileTest.testGrpParsed_colourNonejalview.io.JSONFileTest.testGrpParsed_colourNone	1PASS
0.01717033	jalview.project.Jalview2xmlTests.testStoreAndRecoverNoOverviewjalview.project.Jalview2xmlTests.testStoreAndRecoverNoOverview	1PASS
0.01717033	jalview.gui.AlignViewportTest.testSetSelectionGroupjalview.gui.AlignViewportTest.testSetSelectionGroup	1PASS
0.01717033	jalview.schemes.ClustalxColourSchemeTest.testFindColour_ignoreGapsjalview.schemes.ClustalxColourSchemeTest.testFindColour_ignoreGaps	1PASS
0.01717033	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModeljalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel	1PASS
0.01717033	jalview.project.Jalview2xmlTests.testPcaViewAssociationjalview.project.Jalview2xmlTests.testPcaViewAssociation	1PASS
0.01717033	jalview.gui.AlignViewportTest.testDeregisterMapping_withNoReferencejalview.gui.AlignViewportTest.testDeregisterMapping_withNoReference	1PASS
0.01717033	jalview.analysis.AlignmentUtilsTests.testFindCdsForProteinjalview.analysis.AlignmentUtilsTests.testFindCdsForProtein	1PASS
0.01717033	jalview.io.BackupFilesTest.backupsEnabledSingleFileBackupTestjalview.io.BackupFilesTest.backupsEnabledSingleFileBackupTest	1PASS
0.01717033	jalview.schemes.ColourSchemesTest.testRegisterColourSchemejalview.schemes.ColourSchemesTest.testRegisterColourScheme	1PASS
0.01717033	jalview.gui.ColourMenuHelperTest.testAddMenuItems_forAlignFramejalview.gui.ColourMenuHelperTest.testAddMenuItems_forAlignFrame	1PASS
0.01717033	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01717033	jalview.gui.QuitHandlerTest.testInstantQuitjalview.gui.QuitHandlerTest.testInstantQuit	1PASS
0.01717033	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01717033	jalview.io.FeaturesFileTest.testPrintJalviewFormatjalview.io.FeaturesFileTest.testPrintJalviewFormat	1PASS
0.01717033	jalview.gui.AlignViewportTest.testGetConsensusSeqjalview.gui.AlignViewportTest.testGetConsensusSeq	1PASS
0.01717033	jalview.gui.QuitHandlerTest.testNoGUIUnsavedChangesjalview.gui.QuitHandlerTest.testNoGUIUnsavedChanges	1PASS
0.01717033	jalview.gui.ScalePanelTest.testBuildPopupMenujalview.gui.ScalePanelTest.testBuildPopupMenu	1PASS
0.01717033	jalview.io.FeaturesFileTest.testPrintJalviewFormat_withFiltersjalview.io.FeaturesFileTest.testPrintJalviewFormat_withFilters	1PASS
0.01717033	jalview.schemes.ColourSchemesTest.testGetColourSchemejalview.schemes.ColourSchemesTest.testGetColourScheme	1PASS
0.01717033	jalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTestjalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTest	1PASS
0.01717033	jalview.gui.SeqPanelTest.testFindMousePosition_wrapped_annotationsjalview.gui.SeqPanelTest.testFindMousePosition_wrapped_annotations	1PASS
0.01717033	jalview.io.gff.GffTests.testResolveExonerateGffjalview.io.gff.GffTests.testResolveExonerateGff	1PASS
0.01717033	jalview.renderer.ScaleRendererTest.testCalculateMarksjalview.renderer.ScaleRendererTest.testCalculateMarks	1PASS
0.01717033	jalview.ext.jmol.JmolCommandsTest.testGetColourBySequenceCommands_hiddenColumnsjalview.ext.jmol.JmolCommandsTest.testGetColourBySequenceCommands_hiddenColumns	1PASS
0.01717033	jalview.gui.AlignViewportTest.testSetGlobalColourSchemejalview.gui.AlignViewportTest.testSetGlobalColourScheme	1PASS
0.01717033	jalview.structures.models.AAStructureBindingModelTest.testBuildColoursMapjalview.structures.models.AAStructureBindingModelTest.testBuildColoursMap	1PASS
0.01717033	jalview.renderer.seqfeatures.FeatureRendererTest.testFilterFeaturesForDisplayjalview.renderer.seqfeatures.FeatureRendererTest.testFilterFeaturesForDisplay	1PASS
0.01717033	jalview.io.TCoffeeScoreFileTest.testGetAsArrayjalview.io.TCoffeeScoreFileTest.testGetAsArray	1PASS
0.01717033	jalview.renderer.seqfeatures.FeatureRendererTest.testFindAllFeaturesjalview.renderer.seqfeatures.FeatureRendererTest.testFindAllFeatures	1PASS
0.01717033	jalview.bin.CommandsTest.structureImageAnnotationsOutputTestjalview.bin.CommandsTest.structureImageAnnotationsOutputTest	1PASS
0.01717033	jalview.bin.CommandsTest.structureImageAnnotationsOutputTestjalview.bin.CommandsTest.structureImageAnnotationsOutputTest	1PASS
0.01717033	jalview.io.BackupFilesTest.backupsEnabledNoRollMaxTestjalview.io.BackupFilesTest.backupsEnabledNoRollMaxTest	1PASS
0.01717033	jalview.gui.SeqPanelTest.testAmbiguousAminoAcidGetsStatusMessagejalview.gui.SeqPanelTest.testAmbiguousAminoAcidGetsStatusMessage	1PASS
0.01717033	jalview.bin.CommandsTest2.structureOpeningArgsTestjalview.bin.CommandsTest2.structureOpeningArgsTest	1PASS
0.01717033	jalview.gui.AlignFrameTest.testHideFeatureColumnsjalview.gui.AlignFrameTest.testHideFeatureColumns	1PASS
0.01717033	jalview.gui.ScalePanelTest.testSelectColumns_withHiddenjalview.gui.ScalePanelTest.testSelectColumns_withHidden	1PASS
0.01717033	jalview.gui.SeqPanelTest.testFindMousePosition_wrapped_noAnnotationsjalview.gui.SeqPanelTest.testFindMousePosition_wrapped_noAnnotations	1PASS
0.01717033	jalview.io.WindowsFileLoadAndSaveTest.loadAndSaveAlignmentjalview.io.WindowsFileLoadAndSaveTest.loadAndSaveAlignment	1PASS
0.01717033	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01717033	jalview.structure.StructureMappingTest.testEqualsjalview.structure.StructureMappingTest.testEquals	1PASS
0.01717033	jalview.renderer.seqfeatures.FeatureRendererTest.testIsVisiblejalview.renderer.seqfeatures.FeatureRendererTest.testIsVisible	1PASS
0.01717033	jalview.bin.CommandsTest.structureImageAnnotationsOutputTestjalview.bin.CommandsTest.structureImageAnnotationsOutputTest	1PASS
0.01717033	jalview.project.Jalview2xmlTests.testStoreAndRecoverOverviewjalview.project.Jalview2xmlTests.testStoreAndRecoverOverview	1PASS
0.01717033	jalview.io.BackupFilesTest.backupsEnabledReverseRollMaxTestjalview.io.BackupFilesTest.backupsEnabledReverseRollMaxTest	1PASS
0.01717033	jalview.io.FeaturesFileTest.testPrintGffFormatjalview.io.FeaturesFileTest.testPrintGffFormat	1PASS
0.01717033	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01717033	jalview.gui.FeatureSettingsTest.testSaveLoadjalview.gui.FeatureSettingsTest.testSaveLoad	1PASS
0.01717033	jalview.project.Jalview2xmlTests.testMergeDatasetsforViewsjalview.project.Jalview2xmlTests.testMergeDatasetsforViews	1PASS
0.01717033	jalview.schemes.PIDColourSchemeTest.testFindColour_ignoreGapsjalview.schemes.PIDColourSchemeTest.testFindColour_ignoreGaps	1PASS
0.01717033	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel_HiddenColumnsjalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel_HiddenColumns	1PASS
0.01717033	jalview.gui.AlignViewportTest.testUpdateConservation_qualityOnlyjalview.gui.AlignViewportTest.testUpdateConservation_qualityOnly	1PASS
0.01717033	jalview.bin.CommandsTest2.structureOpeningArgsTestjalview.bin.CommandsTest2.structureOpeningArgsTest	1PASS
0.01717033	jalview.controller.AlignViewControllerTest.testFindColumnsWithFeaturejalview.controller.AlignViewControllerTest.testFindColumnsWithFeature	1PASS
0.01717033	jalview.renderer.seqfeatures.FeatureRendererTest.testGetColourjalview.renderer.seqfeatures.FeatureRendererTest.testGetColour	1PASS
0.01717033	jalview.gui.PairwiseAlignmentPanelTest.testConstructor_noSelectionGroupjalview.gui.PairwiseAlignmentPanelTest.testConstructor_noSelectionGroup	1PASS
0.01717033	jalview.io.FeaturesFileTest.testParse_mixedJalviewGffjalview.io.FeaturesFileTest.testParse_mixedJalviewGff	1PASS
0.01717033	jalview.gui.QuitHandlerTest.testForceQuitjalview.gui.QuitHandlerTest.testForceQuit	1PASS
0.01717033	jalview.io.FeaturesFileTest.testParse_jalviewFeaturesOnlyjalview.io.FeaturesFileTest.testParse_jalviewFeaturesOnly	1PASS
0.01717033	jalview.gui.DesktopTests.testInternalCopyPastejalview.gui.DesktopTests.testInternalCopyPaste	1PASS
0.01717033	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01717033	jalview.analysis.AlignmentUtilsTests.testFindCdsPositions_fivePrimeIncompletejalview.analysis.AlignmentUtilsTests.testFindCdsPositions_fivePrimeIncomplete	1PASS
0.01717033	jalview.io.BackupFilesTest.noBackupsEnabledTestjalview.io.BackupFilesTest.noBackupsEnabledTest	1PASS
0.01717033	jalview.bin.CommandsTest2.structureOpeningArgsTestjalview.bin.CommandsTest2.structureOpeningArgsTest	1PASS
0.01717033	jalview.io.vcf.VCFLoaderTest.testDoLoad_vepCsqjalview.io.vcf.VCFLoaderTest.testDoLoad_vepCsq	1PASS
0.01717033	jalview.bin.CommandsTest2.structureOpeningArgsTestjalview.bin.CommandsTest2.structureOpeningArgsTest	1PASS
0.01717033	jalview.gui.AlignmentPanelTest.testSetOverviewTitle_automaticOverviewjalview.gui.AlignmentPanelTest.testSetOverviewTitle_automaticOverview	1PASS
0.01717033	jalview.io.FeaturesFileTest.testPrintGffFormat_withFiltersjalview.io.FeaturesFileTest.testPrintGffFormat_withFilters	1PASS
0.01717033	jalview.gui.AlignViewportTest.testShowOrDontShowOccupancyjalview.gui.AlignViewportTest.testShowOrDontShowOccupancy	1PASS
0.01717033	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.01717033	jalview.gui.StructureChooserTest.openStructureFileForSequenceTestjalview.gui.StructureChooserTest.openStructureFileForSequenceTest	1PASS
0.01717033	jalview.project.Jalview2xmlTests.testStoreAndRecoverGeneLocusjalview.project.Jalview2xmlTests.testStoreAndRecoverGeneLocus	1PASS
0.01717033	jalview.gui.StructureChooserTest.openStructureFileForSequenceTestjalview.gui.StructureChooserTest.openStructureFileForSequenceTest	1PASS
0.01717033	jalview.gui.QuitHandlerTest.testSavedProjectChangesjalview.gui.QuitHandlerTest.testSavedProjectChanges	1PASS
0.01717033	jalview.project.Jalview2xmlTests.testMergeDatasetsforManyViewsjalview.project.Jalview2xmlTests.testMergeDatasetsforManyViews	1PASS
0.01717033	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01717033	jalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTestjalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTest	1PASS
0.01717033	jalview.io.FeaturesFileTest.testParsejalview.io.FeaturesFileTest.testParse	1PASS
0.01717033	jalview.bin.CommandsTest.structureImageAnnotationsOutputTestjalview.bin.CommandsTest.structureImageAnnotationsOutputTest	1PASS
0.01717033	jalview.io.AnnotationExporterTest.testAnnotationExportAsCSVjalview.io.AnnotationExporterTest.testAnnotationExportAsCSV	1PASS
0.01717033	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01717033	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.01717033	jalview.gui.AlignViewportTest.testDeregisterMapping_onCloseViewjalview.gui.AlignViewportTest.testDeregisterMapping_onCloseView	1PASS
0.01717033	jalview.io.gff.ExonerateHelperTest.testAddExonerateGffToAlignmentjalview.io.gff.ExonerateHelperTest.testAddExonerateGffToAlignment	1PASS
0.01717033	jalview.gui.SeqPanelTest.testFindMousePosition_wrapped_scaleAbovejalview.gui.SeqPanelTest.testFindMousePosition_wrapped_scaleAbove	1PASS
0.01717033	jalview.io.FeaturesFileTest.testParse_pureGff3jalview.io.FeaturesFileTest.testParse_pureGff3	1PASS
0.01717033	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.01717033	jalview.gui.SeqPanelTest.testFindMousePosition_wrapped_scales_longSequencejalview.gui.SeqPanelTest.testFindMousePosition_wrapped_scales_longSequence	1PASS
0.01717033	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFindFeatureAt_PointFeaturejalview.analysis.scoremodels.FeatureDistanceModelTest.testFindFeatureAt_PointFeature	1PASS
0.01717033	jalview.gui.AlignViewportTest.testDeregisterMapping_withReferencejalview.gui.AlignViewportTest.testDeregisterMapping_withReference	1PASS
0.01717033	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.01717033	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFindDistancesjalview.analysis.scoremodels.FeatureDistanceModelTest.testFindDistances	1PASS
0.01717033	jalview.gui.QuitHandlerTest.testSavedAlignmentChangesjalview.gui.QuitHandlerTest.testSavedAlignmentChanges	1PASS
0.01717033	jalview.gui.ScalePanelTest.testPreventNegativeStartColumnjalview.gui.ScalePanelTest.testPreventNegativeStartColumn	1PASS
0.01717033	jalview.gui.PairwiseAlignmentPanelTest.testConstructor_withSelectionGroupjalview.gui.PairwiseAlignmentPanelTest.testConstructor_withSelectionGroup	1PASS
0.01717033	jalview.gui.AlignFrameTest.testNewView_dsRefPreservedjalview.gui.AlignFrameTest.testNewView_dsRefPreserved	1PASS
0.01717033	jalview.controller.AlignViewControllerTest.testSelectColumnsWithHighlightjalview.controller.AlignViewControllerTest.testSelectColumnsWithHighlight	1PASS
0.01717033	jalview.gui.AlignmentPanelTest.testSetOverviewTitlejalview.gui.AlignmentPanelTest.testSetOverviewTitle	1PASS
0.013049451	jalview.analysis.AlignmentUtilsTests.testFindCdsPositionsjalview.analysis.AlignmentUtilsTests.testFindCdsPositions	1PASS
0.013736264	jalview.analysis.AlignmentUtilsTests.testHasCrossRefjalview.analysis.AlignmentUtilsTests.testHasCrossRef	1PASS
0.013736264	jalview.analysis.AlignmentUtilsTests.testHaveCrossRefjalview.analysis.AlignmentUtilsTests.testHaveCrossRef	1PASS
0.012362638	jalview.datamodel.PAEContactMatrixTest.testSeqAssociatedPAEMatrixjalview.datamodel.PAEContactMatrixTest.testSeqAssociatedPAEMatrix	1PASS
0.010989011	jalview.util.MappingUtilsTest.testMapColumnSelection_nulljalview.util.MappingUtilsTest.testMapColumnSelection_null	1PASS
0.010989011	jalview.renderer.OverviewResColourFinderTest.testGetResidueBoxColour_zappojalview.renderer.OverviewResColourFinderTest.testGetResidueBoxColour_zappo	1PASS
0.010989011	jalview.analysis.DnaTest.testTranslateCdna_withUntranslatableCodonsAndHiddenColumnsjalview.analysis.DnaTest.testTranslateCdna_withUntranslatableCodonsAndHiddenColumns	1PASS
0.010989011	jalview.analysis.FinderTest.testFind_inDescriptionjalview.analysis.FinderTest.testFind_inDescription	1PASS
0.010989011	jalview.util.MappingUtilsTest.testMapSequenceGroup_regionjalview.util.MappingUtilsTest.testMapSequenceGroup_region	1PASS
0.010989011	jalview.analysis.FinderTest.testFindAll_sequenceIdsjalview.analysis.FinderTest.testFindAll_sequenceIds	1PASS
0.010989011	jalview.gui.SeqPanelTest.testSetStatusReturnsNearestResiduePositionjalview.gui.SeqPanelTest.testSetStatusReturnsNearestResiduePosition	1PASS
0.010989011	jalview.util.MappingUtilsTest.testMapSequenceGroup_columnsjalview.util.MappingUtilsTest.testMapSequenceGroup_columns	1PASS
0.010989011	jalview.renderer.OverviewResColourFinderTest.testGetResidueBoxColour_nonejalview.renderer.OverviewResColourFinderTest.testGetResidueBoxColour_none	1PASS
0.010989011	jalview.analysis.DnaTest.testReverseCdnajalview.analysis.DnaTest.testReverseCdna	1PASS
0.010989011	jalview.util.MappingUtilsTest.testMapColumnSelection_dnaToProteinjalview.util.MappingUtilsTest.testMapColumnSelection_dnaToProtein	1PASS
0.010989011	jalview.util.MappingUtilsTest.testMapColumnSelection_hiddenColumnsjalview.util.MappingUtilsTest.testMapColumnSelection_hiddenColumns	1PASS
0.010989011	jalview.util.MappingUtilsTest.testMapColumnSelection_proteinToDnajalview.util.MappingUtilsTest.testMapColumnSelection_proteinToDna	1PASS
0.010989011	jalview.renderer.ResidueColourFinderTest.testGetResidueColour_zappojalview.renderer.ResidueColourFinderTest.testGetResidueColour_zappo	1PASS
0.010989011	jalview.datamodel.HiddenSequencesTest.testHideShowSequence_withHiddenRepSequencejalview.datamodel.HiddenSequencesTest.testHideShowSequence_withHiddenRepSequence	1PASS
0.010989011	jalview.renderer.ResidueColourFinderTest.testGetResidueColour_nonejalview.renderer.ResidueColourFinderTest.testGetResidueColour_none	1PASS
0.010989011	jalview.renderer.ResidueColourFinderTest.testGetResidueColour_userdefjalview.renderer.ResidueColourFinderTest.testGetResidueColour_userdef	1PASS
0.010989011	jalview.util.MappingUtilsTest.testMapSequenceGroup_sharedDatasetjalview.util.MappingUtilsTest.testMapSequenceGroup_sharedDataset	1PASS
0.010989011	jalview.gui.PaintRefresherTest.testGetAssociatedPanelsjalview.gui.PaintRefresherTest.testGetAssociatedPanels	1PASS
0.010989011	jalview.util.MappingUtilsTest.testMapSequenceGroup_sequencesjalview.util.MappingUtilsTest.testMapSequenceGroup_sequences	1PASS
0.010989011	jalview.renderer.OverviewResColourFinderTest.testGetResidueBoxColour_userdefjalview.renderer.OverviewResColourFinderTest.testGetResidueBoxColour_userdef	1PASS
0.009615385	jalview.analysis.AlignmentUtilsTests.testGetSequencesByNamejalview.analysis.AlignmentUtilsTests.testGetSequencesByName	1PASS
0.009615385	jalview.analysis.AlignmentUtilsTests.testTransferGeneLocijalview.analysis.AlignmentUtilsTests.testTransferGeneLoci	1PASS
0.006868132	jalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSourcesjalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSources	1PASS
0.007554945	jalview.gui.PopupMenuTest.testHideInsertionsjalview.gui.PopupMenuTest.testHideInsertions	1PASS
0.007554945	jalview.gui.AnnotationChooserTest.testSelectType_hideForAlljalview.gui.AnnotationChooserTest.testSelectType_hideForAll	1PASS
0.007554945	jalview.gui.AnnotationChooserTest.testSelectType_hideForSelectedjalview.gui.AnnotationChooserTest.testSelectType_hideForSelected	1PASS
0.008241759	jalview.analysis.AlignmentUtilsTests.testShowOrHideSequenceAnnotationsjalview.analysis.AlignmentUtilsTests.testShowOrHideSequenceAnnotations	1PASS
0.007554945	jalview.analysis.AnnotationSorterTest.testNoSort_autocalcFirstjalview.analysis.AnnotationSorterTest.testNoSort_autocalcFirst	1PASS
0.007554945	jalview.gui.AnnotationChooserTest.testDeselectType_showForAlljalview.gui.AnnotationChooserTest.testDeselectType_showForAll	1PASS
0.007554945	jalview.analysis.AnnotationSorterTest.testSort_timingUnsortedjalview.analysis.AnnotationSorterTest.testSort_timingUnsorted	1PASS
0.007554945	jalview.analysis.AnnotationSorterTest.testSortByTypeAndSequence_autocalcLastjalview.analysis.AnnotationSorterTest.testSortByTypeAndSequence_autocalcLast	1PASS
0.007554945	jalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_noReferenceAnnotationsjalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_noReferenceAnnotations	1PASS
0.007554945	jalview.gui.AnnotationChooserTest.testDeselectType_hideForAlljalview.gui.AnnotationChooserTest.testDeselectType_hideForAll	1PASS
0.007554945	jalview.gui.AnnotationChooserTest.testIsInActionScope_selectedScopejalview.gui.AnnotationChooserTest.testIsInActionScope_selectedScope	1PASS
0.007554945	jalview.analysis.AnnotationSorterTest.testSortBySequenceAndType_autocalcLastjalview.analysis.AnnotationSorterTest.testSortBySequenceAndType_autocalcLast	1PASS
0.006181319	jalview.analysis.GroupingTest.testMakeGroupsWithBothjalview.analysis.GroupingTest.testMakeGroupsWithBoth	1PASS
0.006181319	jalview.workers.AlignCalcManagerTest.testRemoveWorkerForAnnotationjalview.workers.AlignCalcManagerTest.testRemoveWorkerForAnnotation	1PASS
0.006868132	jalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSourcesjalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSources	1PASS
0.007554945	jalview.gui.AnnotationChooserTest.testDeselectType_showForSelectedjalview.gui.AnnotationChooserTest.testDeselectType_showForSelected	1PASS
0.007554945	jalview.io.AnnotatedPDBFileInputTest.checkPDBSequenceFeaturesjalview.io.AnnotatedPDBFileInputTest.checkPDBSequenceFeatures	1PASS
0.007554945	jalview.gui.AnnotationChooserTest.testIsInActionScope_unselectedScopejalview.gui.AnnotationChooserTest.testIsInActionScope_unselectedScope	1PASS
0.007554945	jalview.analysis.AnnotationSorterTest.testSort_timingSemisortedjalview.analysis.AnnotationSorterTest.testSort_timingSemisorted	1PASS
0.007554945	jalview.gui.AnnotationChooserTest.testSelectType_showForSelectedjalview.gui.AnnotationChooserTest.testSelectType_showForSelected	1PASS
0.007554945	jalview.analysis.AnnotationSorterTest.testSortBySequenceAndType_autocalcFirstjalview.analysis.AnnotationSorterTest.testSortBySequenceAndType_autocalcFirst	1PASS
0.007554945	jalview.gui.AnnotationChooserTest.testDeselectType_hideForSelectedjalview.gui.AnnotationChooserTest.testDeselectType_hideForSelected	1PASS
0.007554945	jalview.gui.AlignFrameTest.testChangeColour_background_groupsAndThresholdsjalview.gui.AlignFrameTest.testChangeColour_background_groupsAndThresholds	1PASS
0.007554945	jalview.gui.AnnotationChooserTest.testResetOriginalStatejalview.gui.AnnotationChooserTest.testResetOriginalState	1PASS
0.007554945	jalview.analysis.AnnotationSorterTest.testSortByTypeAndSequence_autocalcFirstjalview.analysis.AnnotationSorterTest.testSortByTypeAndSequence_autocalcFirst	1PASS
0.007554945	jalview.gui.AnnotationColumnChooserTest.testResetjalview.gui.AnnotationColumnChooserTest.testReset	1PASS
0.007554945	jalview.gui.AnnotationChooserTest.testSelectType_showForAlljalview.gui.AnnotationChooserTest.testSelectType_showForAll	1PASS
0.007554945	jalview.analysis.AnnotationSorterTest.testSort_timingPresortedjalview.analysis.AnnotationSorterTest.testSort_timingPresorted	1PASS
0.0054945056	jalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSourcesjalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSources	1PASS
0.006181319	jalview.ext.jmol.JmolParserTest.testFileParserjalview.ext.jmol.JmolParserTest.testFileParser	1PASS
0.0041208793	jalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_noSequenceSelectedjalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_noSequenceSelected	1PASS

Source view

/*
 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
 * Copyright (C) $$Year-Rel$$ The Jalview Authors
 *
 * This file is part of Jalview.
 *
 * Jalview is free software: you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation, either version 3
 * of the License, or (at your option) any later version.
 *
 * Jalview is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty
 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
 * PURPOSE. See the GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
 * The Jalview Authors are detailed in the 'AUTHORS' file.
 */

package jalview.analysis;

import java.awt.Color;

import java.util.ArrayList;

import java.util.Arrays;

import java.util.Collection;

import java.util.Collections;

import java.util.HashMap;

import java.util.HashSet;

import java.util.Iterator;

import java.util.LinkedHashMap;

import java.util.List;

import java.util.Locale;

import java.util.Map;

import java.util.Map.Entry;

import java.util.NoSuchElementException;

import java.util.Set;

import java.util.SortedMap;

import java.util.TreeMap;

import java.util.Vector;

import java.util.stream.Collectors;

import jalview.bin.Console;

import jalview.commands.RemoveGapColCommand;

import jalview.datamodel.AlignedCodon;

import jalview.datamodel.AlignedCodonFrame;

import jalview.datamodel.AlignedCodonFrame.SequenceToSequenceMapping;

import jalview.datamodel.Alignment;

import jalview.datamodel.AlignmentAnnotation;

import jalview.datamodel.AlignmentI;

import jalview.datamodel.Annotation;

import jalview.datamodel.ContactMatrixI;

import jalview.datamodel.DBRefEntry;

import jalview.datamodel.GeneLociI;

import jalview.datamodel.IncompleteCodonException;

import jalview.datamodel.Mapping;

import jalview.datamodel.PDBEntry;

import jalview.datamodel.Sequence;

import jalview.datamodel.SequenceFeature;

import jalview.datamodel.SequenceGroup;

import jalview.datamodel.SequenceI;

import jalview.datamodel.features.SequenceFeatures;

import jalview.io.gff.SequenceOntologyI;

import jalview.schemes.ResidueProperties;

import jalview.util.ColorUtils;

import jalview.util.Comparison;

import jalview.util.Constants;

import jalview.util.DBRefUtils;

import jalview.util.IntRangeComparator;

import jalview.util.MapList;

import jalview.util.MappingUtils;

/**
 * Grab bag of useful alignment manipulation operations. Expect these to be
 * refactored elsewhere at some point.
 *
 * @author jimp
 */

public class AlignmentUtils

{

private static final int CODON_LENGTH = 3;

private static final String SEQUENCE_VARIANT = "sequence_variant:";

/*
 * the 'id' attribute is provided for variant features fetched from
 * Ensembl using its REST service with JSON format
 */

public static final String VARIANT_ID = "id";

/**

* A data model to hold the 'normal' base value at a position, and an optional

* sequence variant feature

static final class DnaVariant

{

final String base;

100

SequenceFeature variant;

101

102

DnaVariant(String nuc)

{

base = nuc;

variant = null;

}

DnaVariant(String nuc, SequenceFeature var)

{

base = nuc;

variant = var;

}

public String getSource()

115

{

116

return variant == null ? null : variant.getFeatureGroup();

}

/**

* toString for aid in the debugger only

121

122

@Override

123

public String toString()

124

{

125

return base + ":" + (variant == null ? "" : variant.getDescription());

}

}

/**

* given an existing alignment, create a new alignment including all, or up to

131

* flankSize additional symbols from each sequence's dataset sequence

* @param core

* @param flankSize

* @return AlignmentI

public static AlignmentI expandContext(AlignmentI core, int flankSize)

138

{

139

List<SequenceI> sq = new ArrayList<>();

140

int maxoffset = 0;

141

for (SequenceI s : core.getSequences())

142

{

143

131

SequenceI newSeq = s.deriveSequence();

144

131

final int newSeqStart = newSeq.getStart() - 1;

145

131

if (newSeqStart > maxoffset

146

&& newSeq.getDatasetSequence().getStart() < s.getStart())

147

{

148

131

maxoffset = newSeqStart;

149

}

150

131

sq.add(newSeq);

}

if (flankSize > -1)

{

maxoffset = Math.min(maxoffset, flankSize);

}

* now add offset left and right to create an expanded alignment

159

160

for (SequenceI s : sq)

161

{

162

131

SequenceI ds = s;

163

262

while (ds.getDatasetSequence() != null)

164

{

165

131

ds = ds.getDatasetSequence();

166

}

167

131

int s_end = s.findPosition(s.getStart() + s.getLength());

168

// find available flanking residues for sequence

169

131

int ustream_ds = s.getStart() - ds.getStart();

170

131

int dstream_ds = ds.getEnd() - s_end;

171

172

// build new flanked sequence

173

174

// compute gap padding to start of flanking sequence

175

131

int offset = maxoffset - ustream_ds;

176

177

// padding is gapChar x ( maxoffset - min(ustream_ds, flank)

178

131

if (flankSize >= 0)

179

{

180

125

if (flankSize < ustream_ds)

181

{

182

// take up to flankSize residues

183

offset = maxoffset - flankSize;

184

ustream_ds = flankSize;

185

}

186

125

if (flankSize <= dstream_ds)

187

{

188

116

dstream_ds = flankSize - 1;

189

}

190

}

191

// TODO use Character.toLowerCase to avoid creating String objects?

192

131

char[] upstream = new String(ds

193

.getSequence(s.getStart() - 1 - ustream_ds, s.getStart() - 1))

194

.toLowerCase(Locale.ROOT).toCharArray();

195

131

char[] downstream = new String(

196

ds.getSequence(s_end - 1, s_end + dstream_ds))

197

.toLowerCase(Locale.ROOT).toCharArray();

198

131

char[] coreseq = s.getSequence();

199

131

char[] nseq = new char[offset + upstream.length + downstream.length

200

+ coreseq.length];

201

131

char c = core.getGapCharacter();

202

203

131

int p = 0;

204

461

for (; p < offset; p++)

205

{

206

330

nseq[p] = c;

207

}

208

209

131

System.arraycopy(upstream, 0, nseq, p, upstream.length);

210

131

System.arraycopy(coreseq, 0, nseq, p + upstream.length,

211

coreseq.length);

212

131

System.arraycopy(downstream, 0, nseq,

213

p + coreseq.length + upstream.length, downstream.length);

214

131

s.setSequence(new String(nseq));

215

131

s.setStart(s.getStart() - ustream_ds);

216

131

s.setEnd(s_end + downstream.length);

217

}

218

AlignmentI newAl = new jalview.datamodel.Alignment(

219

sq.toArray(new SequenceI[0]));

220

for (SequenceI s : sq)

221

{

222

131

if (s.getAnnotation() != null)

223

{

224

for (AlignmentAnnotation aa : s.getAnnotation())

225

{

226

aa.adjustForAlignment(); // JAL-1712 fix

227

newAl.addAnnotation(aa);

}

}

}

newAl.setDataset(core.getDataset());

return newAl;

}

/**

* Returns the index (zero-based position) of a sequence in an alignment, or

* -1 if not found.

* @param al

* @param seq

* @return

59593

public static int getSequenceIndex(AlignmentI al, SequenceI seq)

244

{

245

59593

int result = -1;

246

59593

int pos = 0;

247

59593

for (SequenceI alSeq : al.getSequences())

248

{

249

126234233

if (alSeq == seq)

250

{

251

59535

result = pos;

252

59535

break;

253

}

254

126174698

pos++;

255

}

256

59593

return result;

}

/**

* Returns a map of lists of sequences in the alignment, keyed by sequence

261

* name. For use in mapping between different alignment views of the same

262

* sequences.

263

264

* @see jalview.datamodel.AlignmentI#getSequencesByName()

265

266

public static Map<String, List<SequenceI>> getSequencesByName(

267

AlignmentI al)

268

{

269

Map<String, List<SequenceI>> theMap = new LinkedHashMap<>();

270

for (SequenceI seq : al.getSequences())

271

{

272

String name = seq.getName();

273

if (name != null)

274

{

275

List<SequenceI> seqs = theMap.get(name);

276

if (seqs == null)

277

{

278

seqs = new ArrayList<>();

279

theMap.put(name, seqs);

}

seqs.add(seq);

}

}

return theMap;

}

/**

* Build mapping of protein to cDNA alignment. Mappings are made between

289

* sequences where the cDNA translates to the protein sequence. Any new

290

* mappings are added to the protein alignment. Returns true if any mappings

291

* either already exist or were added, else false.

292

293

* @param proteinAlignment

294

* @param cdnaAlignment

295

* @return

296

297

public static boolean mapProteinAlignmentToCdna(

298

final AlignmentI proteinAlignment, final AlignmentI cdnaAlignment)

299

{

300

if (proteinAlignment == null || cdnaAlignment == null)

{

return false;

}

Set<SequenceI> mappedDna = new HashSet<>();

306

Set<SequenceI> mappedProtein = new HashSet<>();

307

308

309

* First pass - map sequences where cross-references exist. This include

310

* 1-to-many mappings to support, for example, variant cDNA.

311

312

boolean mappingPerformed = mapProteinToCdna(proteinAlignment,

313

cdnaAlignment, mappedDna, mappedProtein, true);

314

315

316

* Second pass - map sequences where no cross-references exist. This only

317

* does 1-to-1 mappings and assumes corresponding sequences are in the same

318

* order in the alignments.

319

320

mappingPerformed |= mapProteinToCdna(proteinAlignment, cdnaAlignment,

321

mappedDna, mappedProtein, false);

322

return mappingPerformed;

}

/**

* Make mappings between compatible sequences (where the cDNA translation

327

* matches the protein).

328

329

* @param proteinAlignment

330

* @param cdnaAlignment

331

* @param mappedDna

332

* a set of mapped DNA sequences (to add to)

333

* @param mappedProtein

334

* a set of mapped Protein sequences (to add to)

335

* @param xrefsOnly

336

* if true, only map sequences where xrefs exist

337

* @return

338

339

protected static boolean mapProteinToCdna(

340

final AlignmentI proteinAlignment, final AlignmentI cdnaAlignment,

341

Set<SequenceI> mappedDna, Set<SequenceI> mappedProtein,

342

boolean xrefsOnly)

343

{

344

boolean mappingExistsOrAdded = false;

345

List<SequenceI> thisSeqs = proteinAlignment.getSequences();

346

for (SequenceI aaSeq : thisSeqs)

347

{

348

boolean proteinMapped = false;

349

AlignedCodonFrame acf = new AlignedCodonFrame();

350

351

for (SequenceI cdnaSeq : cdnaAlignment.getSequences())

352

{

353

354

* Always try to map if sequences have xref to each other; this supports

355

* variant cDNA or alternative splicing for a protein sequence.

356

357

* If no xrefs, try to map progressively, assuming that alignments have

358

* mappable sequences in corresponding order. These are not

359

* many-to-many, as that would risk mixing species with similar cDNA

360

* sequences.

361

362

if (xrefsOnly && !AlignmentUtils.haveCrossRef(aaSeq, cdnaSeq))

{

continue;

}

* Don't map non-xrefd sequences more than once each. This heuristic

369

* allows us to pair up similar sequences in ordered alignments.

370

371

if (!xrefsOnly && (mappedProtein.contains(aaSeq)

372

|| mappedDna.contains(cdnaSeq)))

{

continue;

}

if (mappingExists(proteinAlignment.getCodonFrames(),

377

aaSeq.getDatasetSequence(), cdnaSeq.getDatasetSequence()))

378

{

379

mappingExistsOrAdded = true;

}

else

{

MapList map = mapCdnaToProtein(aaSeq, cdnaSeq);

384

if (map != null)

385

{

386

acf.addMap(cdnaSeq, aaSeq, map);

387

mappingExistsOrAdded = true;

388

proteinMapped = true;

389

mappedDna.add(cdnaSeq);

390

mappedProtein.add(aaSeq);

}

}

}

if (proteinMapped)

{

proteinAlignment.addCodonFrame(acf);

397

}

398

}

399

return mappingExistsOrAdded;

}

/**

* Answers true if the mappings include one between the given (dataset)

404

* sequences.

405

406

protected static boolean mappingExists(List<AlignedCodonFrame> mappings,

407

SequenceI aaSeq, SequenceI cdnaSeq)

408

{

409

if (mappings != null)

410

{

411

for (AlignedCodonFrame acf : mappings)

412

{

413

if (cdnaSeq == acf.getDnaForAaSeq(aaSeq))

{

return true;

}

}

}

return false;

}

/**

* Builds a mapping (if possible) of a cDNA to a protein sequence.

424

* <ul>

425

* <li>first checks if the cdna translates exactly to the protein

426

* sequence</li>

427

* <li>else checks for translation after removing a STOP codon</li>

428

* <li>else checks for translation after removing a START codon</li>

429

* <li>if that fails, inspect CDS features on the cDNA sequence</li>

430

* </ul>

431

* Returns null if no mapping is determined.

432

433

* @param proteinSeq

434

* the aligned protein sequence

435

* @param cdnaSeq

436

* the aligned cdna sequence

437

* @return

438

439

public static MapList mapCdnaToProtein(SequenceI proteinSeq,

SequenceI cdnaSeq)

{

* Here we handle either dataset sequence set (desktop) or absent (applet).

444

* Use only the char[] form of the sequence to avoid creating possibly large

445

* String objects.

446

447

final SequenceI proteinDataset = proteinSeq.getDatasetSequence();

448

char[] aaSeqChars = proteinDataset != null

449

? proteinDataset.getSequence()

450

: proteinSeq.getSequence();

451

final SequenceI cdnaDataset = cdnaSeq.getDatasetSequence();

452

char[] cdnaSeqChars = cdnaDataset != null ? cdnaDataset.getSequence()

453

: cdnaSeq.getSequence();

454

if (aaSeqChars == null || cdnaSeqChars == null)

{

return null;

}

* cdnaStart/End, proteinStartEnd are base 1 (for dataset sequence mapping)

461

462

final int mappedLength = CODON_LENGTH * aaSeqChars.length;

463

int cdnaLength = cdnaSeqChars.length;

464

int cdnaStart = cdnaSeq.getStart();

465

int cdnaEnd = cdnaSeq.getEnd();

466

final int proteinStart = proteinSeq.getStart();

467

final int proteinEnd = proteinSeq.getEnd();

468

469

470

* If lengths don't match, try ignoring stop codon (if present)

471

472

if (cdnaLength != mappedLength && cdnaLength > 2)

473

{

474

String lastCodon = String.valueOf(cdnaSeqChars,

475

cdnaLength - CODON_LENGTH, CODON_LENGTH)

476

.toUpperCase(Locale.ROOT);

477

for (String stop : ResidueProperties.STOP_CODONS)

478

{

479

if (lastCodon.equals(stop))

480

{

481

cdnaEnd -= CODON_LENGTH;

482

cdnaLength -= CODON_LENGTH;

break;

}

}

}

* If lengths still don't match, try ignoring start codon.

490

491

int startOffset = 0;

492

if (cdnaLength != mappedLength && cdnaLength > 2

493

&& String.valueOf(cdnaSeqChars, 0, CODON_LENGTH)

494

.toUpperCase(Locale.ROOT)

495

.equals(ResidueProperties.START))

496

{

497

startOffset += CODON_LENGTH;

498

cdnaStart += CODON_LENGTH;

499

cdnaLength -= CODON_LENGTH;

500

}

501

502

if (translatesAs(cdnaSeqChars, startOffset, aaSeqChars))

503

{

504

505

* protein is translation of dna (+/- start/stop codons)

506

507

MapList map = new MapList(new int[] { cdnaStart, cdnaEnd },

508

new int[]

509

{ proteinStart, proteinEnd }, CODON_LENGTH, 1);

return map;

}

* translation failed - try mapping CDS annotated regions of dna

515

516

return mapCdsToProtein(cdnaSeq, proteinSeq);

}

/**

* Test whether the given cdna sequence, starting at the given offset,

521

* translates to the given amino acid sequence, using the standard translation

522

* table. Designed to fail fast i.e. as soon as a mismatch position is found.

523

524

* @param cdnaSeqChars

* @param cdnaStart

* @param aaSeqChars

* @return

protected static boolean translatesAs(char[] cdnaSeqChars, int cdnaStart,

530

char[] aaSeqChars)

531

{

532

if (cdnaSeqChars == null || aaSeqChars == null)

{

return false;

}

int aaPos = 0;

int dnaPos = cdnaStart;

539

161

for (; dnaPos < cdnaSeqChars.length - 2

540

&& aaPos < aaSeqChars.length; dnaPos += CODON_LENGTH, aaPos++)

541

{

542

130

String codon = String.valueOf(cdnaSeqChars, dnaPos, CODON_LENGTH);

543

130

final String translated = ResidueProperties.codonTranslate(codon);

544

545

546

* allow * in protein to match untranslatable in dna

547

548

130

final char aaRes = aaSeqChars[aaPos];

549

130

if ((translated == null || ResidueProperties.STOP.equals(translated))

&& aaRes == '*')

{

continue;

}

126

if (translated == null || !(aaRes == translated.charAt(0)))

555

{

556

// debug

557

// jalview.bin.Console.outPrintln(("Mismatch at " + i + "/" + aaResidue

558

// + ": "

559

// + codon + "(" + translated + ") != " + aaRes));

return false;

}

}

* check we matched all of the protein sequence

566

567

if (aaPos != aaSeqChars.length)

{

return false;

}

* check we matched all of the dna except

574

* for optional trailing STOP codon

575

576

if (dnaPos == cdnaSeqChars.length)

{

return true;

}

if (dnaPos == cdnaSeqChars.length - CODON_LENGTH)

581

{

582

String codon = String.valueOf(cdnaSeqChars, dnaPos, CODON_LENGTH);

583

if (ResidueProperties.STOP

584

.equals(ResidueProperties.codonTranslate(codon)))

{

return true;

}

}

return false;

}

/**

* Align sequence 'seq' to match the alignment of a mapped sequence. Note this

594

* currently assumes that we are aligning cDNA to match protein.

595

596

* @param seq

597

* the sequence to be realigned

598

* @param al

599

* the alignment whose sequence alignment is to be 'copied'

600

* @param gap

601

* character string represent a gap in the realigned sequence

602

* @param preserveUnmappedGaps

603

* @param preserveMappedGaps

604

* @return true if the sequence was realigned, false if it could not be

605

606

public static boolean alignSequenceAs(SequenceI seq, AlignmentI al,

607

String gap, boolean preserveMappedGaps,

608

boolean preserveUnmappedGaps)

609

{

610

611

* Get any mappings from the source alignment to the target (dataset)

612

* sequence.

613

614

// TODO there may be one AlignedCodonFrame per dataset sequence, or one with

615

// all mappings. Would it help to constrain this?

616

List<AlignedCodonFrame> mappings = al.getCodonFrame(seq);

617

if (mappings == null || mappings.isEmpty())

{

return false;

}

* Locate the aligned source sequence whose dataset sequence is mapped. We

624

* just take the first match here (as we can't align like more than one

625

* sequence).

626

627

SequenceI alignFrom = null;

628

AlignedCodonFrame mapping = null;

629

for (AlignedCodonFrame mp : mappings)

630

{

631

alignFrom = mp.findAlignedSequence(seq, al);

632

if (alignFrom != null)

{

mapping = mp;

break;

}

}

if (alignFrom == null)

{

return false;

}

alignSequenceAs(seq, alignFrom, mapping, gap, al.getGapCharacter(),

644

preserveMappedGaps, preserveUnmappedGaps);

return true;

}

/**

* Align sequence 'alignTo' the same way as 'alignFrom', using the mapping to

650

* match residues and codons. Flags control whether existing gaps in unmapped

651

* (intron) and mapped (exon) regions are preserved or not. Gaps between

652

* intron and exon are only retained if both flags are set.

* @param alignTo

* @param alignFrom

* @param mapping

* @param myGap

* @param sourceGap

* @param preserveUnmappedGaps

660

* @param preserveMappedGaps

661

662

public static void alignSequenceAs(SequenceI alignTo, SequenceI alignFrom,

663

AlignedCodonFrame mapping, String myGap, char sourceGap,

664

boolean preserveMappedGaps, boolean preserveUnmappedGaps)

665

{

666

// TODO generalise to work for Protein-Protein, dna-dna, dna-protein

667

668

// aligned and dataset sequence positions, all base zero

int thisSeqPos = 0;

int sourceDsPos = 0;

int basesWritten = 0;

673

char myGapChar = myGap.charAt(0);

674

int ratio = myGap.length();

675

676

int fromOffset = alignFrom.getStart() - 1;

677

int toOffset = alignTo.getStart() - 1;

678

int sourceGapMappedLength = 0;

679

boolean inExon = false;

680

final int toLength = alignTo.getLength();

681

final int fromLength = alignFrom.getLength();

682

StringBuilder thisAligned = new StringBuilder(2 * toLength);

683

684

685

* Traverse the 'model' aligned sequence

686

687

205

for (int i = 0; i < fromLength; i++)

688

{

689

186

char sourceChar = alignFrom.getCharAt(i);

690

186

if (sourceChar == sourceGap)

691

{

692

sourceGapMappedLength += ratio;

continue;

}

* Found a non-gap character. Locate its mapped region if any.

698

699

142

sourceDsPos++;

700

// Note mapping positions are base 1, our sequence positions base 0

701

142

int[] mappedPos = mapping.getMappedRegion(alignTo, alignFrom,

702

sourceDsPos + fromOffset);

703

142

if (mappedPos == null)

704

{

705

706

* unmapped position; treat like a gap

707

708

sourceGapMappedLength += ratio;

709

// jalview.bin.Console.errPrintln("Can't align: no codon mapping to

710

// residue "

711

// + sourceDsPos + "(" + sourceChar + ")");

// return;

continue;

}

int mappedCodonStart = mappedPos[0]; // position (1...) of codon start

717

int mappedCodonEnd = mappedPos[mappedPos.length - 1]; // codon end pos

718

StringBuilder trailingCopiedGap = new StringBuilder();

719

720

721

* Copy dna sequence up to and including this codon. Optionally, include

722

* gaps before the codon starts (in introns) and/or after the codon starts

723

* (in exons).

724

725

* Note this only works for 'linear' splicing, not reverse or interleaved.

726

* But then 'align dna as protein' doesn't make much sense otherwise.

727

728

int intronLength = 0;

729

294

while (basesWritten + toOffset < mappedCodonEnd

730

&& thisSeqPos < toLength)

731

{

732

246

final char c = alignTo.getCharAt(thisSeqPos++);

733

246

if (c != myGapChar)

734

{

735

146

basesWritten++;

736

146

int sourcePosition = basesWritten + toOffset;

737

146

if (sourcePosition < mappedCodonStart)

738

{

739

740

* Found an unmapped (intron) base. First add in any preceding gaps

741

* (if wanted).

742

743

if (preserveUnmappedGaps && trailingCopiedGap.length() > 0)

744

{

745

thisAligned.append(trailingCopiedGap.toString());

746

intronLength += trailingCopiedGap.length();

747

trailingCopiedGap = new StringBuilder();

}

intronLength++;

inExon = false;

}

else

{

final boolean startOfCodon = sourcePosition == mappedCodonStart;

755

int gapsToAdd = calculateGapsToInsert(preserveMappedGaps,

756

preserveUnmappedGaps, sourceGapMappedLength, inExon,

757

trailingCopiedGap.length(), intronLength, startOfCodon);

758

215

for (int k = 0; k < gapsToAdd; k++)

759

{

760

117

thisAligned.append(myGapChar);

761

}

762

sourceGapMappedLength = 0;

763

inExon = true;

764

}

765

146

thisAligned.append(c);

766

146

trailingCopiedGap = new StringBuilder();

}

else

{

100

if (inExon && preserveMappedGaps)

771

{

772

trailingCopiedGap.append(myGapChar);

773

}

774

else if (!inExon && preserveUnmappedGaps)

775

{

776

trailingCopiedGap.append(myGapChar);

}

}

}

}

* At end of model aligned sequence. Copy any remaining target sequence, optionally

784

* including (intron) gaps.

785

786

129

while (thisSeqPos < toLength)

787

{

788

110

final char c = alignTo.getCharAt(thisSeqPos++);

789

110

if (c != myGapChar || preserveUnmappedGaps)

790

{

791

102

thisAligned.append(c);

792

}

793

110

sourceGapMappedLength--;

}

* finally add gaps to pad for any trailing source gaps or

798

* unmapped characters

799

800

if (preserveUnmappedGaps)

801

{

802

while (sourceGapMappedLength > 0)

803

{

804

thisAligned.append(myGapChar);

805

sourceGapMappedLength--;

}

}

* All done aligning, set the aligned sequence.

811

812

alignTo.setSequence(new String(thisAligned));

}

/**

* Helper method to work out how many gaps to insert when realigning.

817

818

* @param preserveMappedGaps

819

* @param preserveUnmappedGaps

820

* @param sourceGapMappedLength

821

* @param inExon

822

* @param trailingCopiedGap

823

* @param intronLength

824

* @param startOfCodon

825

* @return

826

827

protected static int calculateGapsToInsert(boolean preserveMappedGaps,

828

boolean preserveUnmappedGaps, int sourceGapMappedLength,

829

boolean inExon, int trailingGapLength, int intronLength,

830

final boolean startOfCodon)

{

int gapsToAdd = 0;

if (startOfCodon)

{

* Reached start of codon. Ignore trailing gaps in intron unless we are

837

* preserving gaps in both exon and intron. Ignore them anyway if the

838

* protein alignment introduces a gap at least as large as the intronic

839

* region.

840

841

if (inExon && !preserveMappedGaps)

842

{

843

trailingGapLength = 0;

844

}

845

if (!inExon && !(preserveMappedGaps && preserveUnmappedGaps))

846

{

847

trailingGapLength = 0;

}

if (inExon)

{

gapsToAdd = Math.max(sourceGapMappedLength, trailingGapLength);

}

else

{

if (intronLength + trailingGapLength <= sourceGapMappedLength)

856

{

857

gapsToAdd = sourceGapMappedLength - intronLength;

}

else

{

gapsToAdd = Math.min(

862

intronLength + trailingGapLength - sourceGapMappedLength,

trailingGapLength);

}

}

}

else

{

* second or third base of codon; check for any gaps in dna

871

872

if (!preserveMappedGaps)

873

{

874

trailingGapLength = 0;

875

}

876

gapsToAdd = Math.max(sourceGapMappedLength, trailingGapLength);

}

return gapsToAdd;

}

/**

* Realigns the given protein to match the alignment of the dna, using codon

883

* mappings to translate aligned codon positions to protein residues.

884

885

* @param protein

886

* the alignment whose sequences are realigned by this method

887

* @param dna

888

* the dna alignment whose alignment we are 'copying'

889

* @return the number of sequences that were realigned

890

891

public static int alignProteinAsDna(AlignmentI protein, AlignmentI dna)

892

{

893

if (protein.isNucleotide() || !dna.isNucleotide())

894

{

895

jalview.bin.Console

896

.errPrintln("Wrong alignment type in alignProteinAsDna");

897

return 0;

898

}

899

List<SequenceI> unmappedProtein = new ArrayList<>();

900

Map<AlignedCodon, Map<SequenceI, AlignedCodon>> alignedCodons = buildCodonColumnsMap(

901

protein, dna, unmappedProtein);

902

return alignProteinAs(protein, alignedCodons, unmappedProtein);

}

/**

* Realigns the given dna to match the alignment of the protein, using codon

907

* mappings to translate aligned peptide positions to codons.

908

909

* Always produces a padded CDS alignment.

910

911

* @param dna

912

* the alignment whose sequences are realigned by this method

913

* @param protein

914

* the protein alignment whose alignment we are 'copying'

915

* @return the number of sequences that were realigned

916

917

public static int alignCdsAsProtein(AlignmentI dna, AlignmentI protein)

918

{

919

if (protein.isNucleotide() || !dna.isNucleotide())

920

{

921

jalview.bin.Console

922

.errPrintln("Wrong alignment type in alignProteinAsDna");

923

return 0;

924

}

925

// todo: implement this

926

List<AlignedCodonFrame> mappings = protein.getCodonFrames();

927

int alignedCount = 0;

928

int width = 0; // alignment width for padding CDS

929

for (SequenceI dnaSeq : dna.getSequences())

930

{

931

if (alignCdsSequenceAsProtein(dnaSeq, protein, mappings,

932

dna.getGapCharacter()))

{

alignedCount++;

}

width = Math.max(dnaSeq.getLength(), width);

}

int oldwidth;

int diff;

for (SequenceI dnaSeq : dna.getSequences())

941

{

942

oldwidth = dnaSeq.getLength();

943

diff = width - oldwidth;

944

if (diff > 0)

945

{

946

dnaSeq.insertCharAt(oldwidth, diff, dna.getGapCharacter());

}

}

return alignedCount;

}

/**

* Helper method to align (if possible) the dna sequence to match the

954

* alignment of a mapped protein sequence. This is currently limited to

955

* handling coding sequence only.

* @param cdsSeq

* @param protein

* @param mappings

* @param gapChar

* @return

static boolean alignCdsSequenceAsProtein(SequenceI cdsSeq,

964

AlignmentI protein, List<AlignedCodonFrame> mappings,

965

char gapChar)

966

{

967

SequenceI cdsDss = cdsSeq.getDatasetSequence();

if (cdsDss == null)

{

System.err

.println("alignCdsSequenceAsProtein needs aligned sequence!");

return false;

}

List<AlignedCodonFrame> dnaMappings = MappingUtils

976

.findMappingsForSequence(cdsSeq, mappings);

977

for (AlignedCodonFrame mapping : dnaMappings)

978

{

979

SequenceI peptide = mapping.findAlignedSequence(cdsSeq, protein);

980

if (peptide != null)

981

{

982

final int peptideLength = peptide.getLength();

983

Mapping map = mapping.getMappingBetween(cdsSeq, peptide);

984

if (map != null)

985

{

986

MapList mapList = map.getMap();

987

if (map.getTo() == peptide.getDatasetSequence())

988

{

989

mapList = mapList.getInverse();

990

}

991

final int cdsLength = cdsDss.getLength();

992

int mappedFromLength = MappingUtils

993

.getLength(mapList.getFromRanges());

994

int mappedToLength = MappingUtils

995

.getLength(mapList.getToRanges());

996

boolean addStopCodon = (cdsLength == mappedFromLength

997

* CODON_LENGTH + CODON_LENGTH)

998

|| (peptide.getDatasetSequence()

999

.getLength() == mappedFromLength - 1);

1000

if (cdsLength != mappedToLength && !addStopCodon)

1001

{

1002

jalview.bin.Console.errPrintln(String.format(

1003

"Can't align cds as protein (length mismatch %d/%d): %s",

1004

cdsLength, mappedToLength, cdsSeq.getName()));

}

* pre-fill the aligned cds sequence with gaps

1009

1010

char[] alignedCds = new char[peptideLength * CODON_LENGTH

1011

+ (addStopCodon ? CODON_LENGTH : 0)];

1012

Arrays.fill(alignedCds, gapChar);

1013

1014

1015

* walk over the aligned peptide sequence and insert mapped

1016

* codons for residues in the aligned cds sequence

1017

1018

int copiedBases = 0;

1019

int cdsStart = cdsDss.getStart();

1020

int proteinPos = peptide.getStart() - 1;

1021

int cdsCol = 0;

1022

1023

for (int col = 0; col < peptideLength; col++)

1024

{

1025

char residue = peptide.getCharAt(col);

1026

1027

if (Comparison.isGap(residue))

1028

{

1029

cdsCol += CODON_LENGTH;

}

else

{

proteinPos++;

int[] codon = mapList.locateInTo(proteinPos, proteinPos);

1035

if (codon == null)

1036

{

1037

// e.g. incomplete start codon, X in peptide

1038

cdsCol += CODON_LENGTH;

}

else

{

for (int j = codon[0]; j <= codon[1]; j++)

1043

{

1044

char mappedBase = cdsDss.getCharAt(j - cdsStart);

1045

alignedCds[cdsCol++] = mappedBase;

copiedBases++;

}

}

}

}

* append stop codon if not mapped from protein,

1054

* closing it up to the end of the mapped sequence

1055

1056

if (copiedBases == cdsLength - CODON_LENGTH)

1057

{

1058

for (int i = alignedCds.length - 1; i >= 0; i--)

1059

{

1060

if (!Comparison.isGap(alignedCds[i]))

1061

{

1062

cdsCol = i + 1; // gap just after end of sequence

break;

}

}

for (int i = cdsLength - CODON_LENGTH; i < cdsLength; i++)

1067

{

1068

alignedCds[cdsCol++] = cdsDss.getCharAt(i);

1069

}

1070

}

1071

cdsSeq.setSequence(new String(alignedCds));

return true;

}

}

}

return false;

}

/**

* Builds a map whose key is an aligned codon position (3 alignment column

1081

* numbers base 0), and whose value is a map from protein sequence to each

1082

* protein's peptide residue for that codon. The map generates an ordering of

1083

* the codons, and allows us to read off the peptides at each position in

1084

* order to assemble 'aligned' protein sequences.

1085

1086

* @param protein

1087

* the protein alignment

1088

* @param dna

1089

* the coding dna alignment

1090

* @param unmappedProtein

1091

* any unmapped proteins are added to this list

1092

* @return

1093

1094

protected static Map<AlignedCodon, Map<SequenceI, AlignedCodon>> buildCodonColumnsMap(

1095

AlignmentI protein, AlignmentI dna,

1096

List<SequenceI> unmappedProtein)

1097

{

1098

1099

* maintain a list of any proteins with no mappings - these will be

1100

* rendered 'as is' in the protein alignment as we can't align them

1101

1102

unmappedProtein.addAll(protein.getSequences());

1103

1104

List<AlignedCodonFrame> mappings = protein.getCodonFrames();

1105

1106

1107

* Map will hold, for each aligned codon position e.g. [3, 5, 6], a map of

1108

* {dnaSequence, {proteinSequence, codonProduct}} at that position. The

1109

* comparator keeps the codon positions ordered.

1110

1111

Map<AlignedCodon, Map<SequenceI, AlignedCodon>> alignedCodons = new TreeMap<>(

1112

new CodonComparator());

1113

1114

for (SequenceI dnaSeq : dna.getSequences())

1115

{

1116

for (AlignedCodonFrame mapping : mappings)

1117

{

1118

516

SequenceI prot = mapping.findAlignedSequence(dnaSeq, protein);

1119

516

if (prot != null)

1120

{

1121

Mapping seqMap = mapping.getMappingForSequence(dnaSeq);

1122

addCodonPositions(dnaSeq, prot, protein.getGapCharacter(), seqMap,

1123

alignedCodons);

1124

unmappedProtein.remove(prot);

}

}

}

* Finally add any unmapped peptide start residues (e.g. for incomplete

1131

* codons) as if at the codon position before the second residue

1132

1133

// TODO resolve JAL-2022 so this fudge can be removed

1134

int mappedSequenceCount = protein.getHeight() - unmappedProtein.size();

1135

addUnmappedPeptideStarts(alignedCodons, mappedSequenceCount);

1136

1137

return alignedCodons;

}

/**

* Scans for any protein mapped from position 2 (meaning unmapped start

1142

* position e.g. an incomplete codon), and synthesizes a 'codon' for it at the

1143

* preceding position in the alignment

1144

1145

* @param alignedCodons

1146

* the codon-to-peptide map

1147

* @param mappedSequenceCount

1148

* the number of distinct sequences in the map

1149

1150

protected static void addUnmappedPeptideStarts(

1151

Map<AlignedCodon, Map<SequenceI, AlignedCodon>> alignedCodons,

1152

int mappedSequenceCount)

1153

{

1154

// TODO delete this ugly hack once JAL-2022 is resolved

1155

// i.e. we can model startPhase > 0 (incomplete start codon)

1156

1157

List<SequenceI> sequencesChecked = new ArrayList<>();

1158

AlignedCodon lastCodon = null;

1159

Map<SequenceI, AlignedCodon> toAdd = new HashMap<>();

1160

1161

for (Entry<AlignedCodon, Map<SequenceI, AlignedCodon>> entry : alignedCodons

1162

.entrySet())

1163

{

1164

1913

for (Entry<SequenceI, AlignedCodon> sequenceCodon : entry.getValue()

1165

.entrySet())

1166

{

1167

10669

SequenceI seq = sequenceCodon.getKey();

1168

10669

if (sequencesChecked.contains(seq))

1169

{

1170

10639

continue;

1171

}

1172

sequencesChecked.add(seq);

1173

AlignedCodon codon = sequenceCodon.getValue();

1174

if (codon.peptideCol > 1)

1175

{

1176

jalview.bin.Console.errPrintln(

1177

"Problem mapping protein with >1 unmapped start positions: "

1178

+ seq.getName());

1179

}

1180

else if (codon.peptideCol == 1)

1181

{

1182

1183

* first position (peptideCol == 0) was unmapped - add it

1184

1185

if (lastCodon != null)

1186

{

1187

AlignedCodon firstPeptide = new AlignedCodon(lastCodon.pos1,

1188

lastCodon.pos2, lastCodon.pos3,

1189

String.valueOf(seq.getCharAt(0)), 0);

1190

toAdd.put(seq, firstPeptide);

}

else

{

* unmapped residue at start of alignment (no prior column) -

1196

* 'insert' at nominal codon [0, 0, 0]

1197

1198

AlignedCodon firstPeptide = new AlignedCodon(0, 0, 0,

1199

String.valueOf(seq.getCharAt(0)), 0);

1200

toAdd.put(seq, firstPeptide);

1201

}

1202

}

1203

if (sequencesChecked.size() == mappedSequenceCount)

1204

{

1205

// no need to check past first mapped position in all sequences

break;

}

}

1913

lastCodon = entry.getKey();

}

* add any new codons safely after iterating over the map

1214

1215

for (Entry<SequenceI, AlignedCodon> startCodon : toAdd.entrySet())

1216

{

1217

addCodonToMap(alignedCodons, startCodon.getValue(),

1218

startCodon.getKey());

}

}

/**

* Update the aligned protein sequences to match the codon alignments given in

* the map.

* @param protein

* @param alignedCodons

1228

* an ordered map of codon positions (columns), with sequence/peptide

1229

* values present in each column

1230

* @param unmappedProtein

1231

* @return

1232

1233

protected static int alignProteinAs(AlignmentI protein,

1234

Map<AlignedCodon, Map<SequenceI, AlignedCodon>> alignedCodons,

1235

List<SequenceI> unmappedProtein)

1236

{

1237

1238

* prefill peptide sequences with gaps

1239

1240

int alignedWidth = alignedCodons.size();

1241

char[] gaps = new char[alignedWidth];

1242

Arrays.fill(gaps, protein.getGapCharacter());

1243

Map<SequenceI, char[]> peptides = new HashMap<>();

1244

for (SequenceI seq : protein.getSequences())

1245

{

1246

if (!unmappedProtein.contains(seq))

1247

{

1248

peptides.put(seq, Arrays.copyOf(gaps, gaps.length));

}

}

* Traverse the codons left to right (as defined by CodonComparator)

1254

* and insert peptides in each column where the sequence is mapped.

1255

* This gives a peptide 'alignment' where residues are aligned if their

1256

* corresponding codons occupy the same columns in the cdna alignment.

1257

1258

int column = 0;

1259

for (AlignedCodon codon : alignedCodons.keySet())

1260

{

1261

1914

final Map<SequenceI, AlignedCodon> columnResidues = alignedCodons

1262

.get(codon);

1263

1914

for (Entry<SequenceI, AlignedCodon> entry : columnResidues.entrySet())

1264

{

1265

10682

char residue = entry.getValue().product.charAt(0);

1266

10682

peptides.get(entry.getKey())[column] = residue;

1267

}

1268

1914

column++;

}

* and finally set the constructed sequences

1273

1274

for (Entry<SequenceI, char[]> entry : peptides.entrySet())

1275

{

1276

entry.getKey().setSequence(new String(entry.getValue()));

}

return 0;

}

/**

* Populate the map of aligned codons by traversing the given sequence

1284

* mapping, locating the aligned positions of mapped codons, and adding those

1285

* positions and their translation products to the map.

1286

1287

* @param dna

1288

* the aligned sequence we are mapping from

1289

* @param protein

1290

* the sequence to be aligned to the codons

1291

* @param gapChar

1292

* the gap character in the dna sequence

1293

* @param seqMap

1294

* a mapping to a sequence translation

1295

* @param alignedCodons

1296

* the map we are building up

1297

1298

static void addCodonPositions(SequenceI dna, SequenceI protein,

1299

char gapChar, Mapping seqMap,

1300

Map<AlignedCodon, Map<SequenceI, AlignedCodon>> alignedCodons)

1301

{

1302

Iterator<AlignedCodon> codons = seqMap.getCodonIterator(dna, gapChar);

1303

1304

1305

* add codon positions, and their peptide translations, to the alignment

1306

* map, while remembering the first codon mapped

1307

1308

10716

while (codons.hasNext())

1309

{

1310

10684

try

1311

{

1312

10684

AlignedCodon codon = codons.next();

1313

10684

addCodonToMap(alignedCodons, codon, protein);

1314

} catch (IncompleteCodonException e)

1315

{

1316

// possible incomplete trailing codon - ignore

1317

} catch (NoSuchElementException e)

1318

{

1319

// possibly peptide lacking STOP

}

}

}

/**

* Helper method to add a codon-to-peptide entry to the aligned codons map

1326

1327

* @param alignedCodons

* @param codon

* @param protein

10690

protected static void addCodonToMap(

1332

Map<AlignedCodon, Map<SequenceI, AlignedCodon>> alignedCodons,

1333

AlignedCodon codon, SequenceI protein)

1334

{

1335

10690

Map<SequenceI, AlignedCodon> seqProduct = alignedCodons.get(codon);

1336

10690

if (seqProduct == null)

1337

{

1338

1914

seqProduct = new HashMap<>();

1339

1914

alignedCodons.put(codon, seqProduct);

1340

}

1341

10690

seqProduct.put(protein, codon);

}

/**

* Returns true if a cDNA/Protein mapping either exists, or could be made,

1346

* between at least one pair of sequences in the two alignments. Currently,

1347

* the logic is:

1348

* <ul>

1349

* <li>One alignment must be nucleotide, and the other protein</li>

1350

* <li>At least one pair of sequences must be already mapped, or mappable</li>

1351

* <li>Mappable means the nucleotide translation matches the protein

1352

* sequence</li>

1353

* <li>The translation may ignore start and stop codons if present in the

* nucleotide</li>

* </ul>

* @param al1

* @param al2

* @return

public static boolean isMappable(AlignmentI al1, AlignmentI al2)

1362

{

1363

if (al1 == null || al2 == null)

{

return false;

}

* Require one nucleotide and one protein

1370

1371

if (al1.isNucleotide() == al2.isNucleotide())

{

return false;

}

AlignmentI dna = al1.isNucleotide() ? al1 : al2;

1376

AlignmentI protein = dna == al1 ? al2 : al1;

1377

List<AlignedCodonFrame> mappings = protein.getCodonFrames();

1378

for (SequenceI dnaSeq : dna.getSequences())

1379

{

1380

for (SequenceI proteinSeq : protein.getSequences())

1381

{

1382

if (isMappable(dnaSeq, proteinSeq, mappings))

{

return true;

}

}

}

return false;

}

/**

* Returns true if the dna sequence is mapped, or could be mapped, to the

* protein sequence.

* @param dnaSeq

* @param proteinSeq

* @param mappings

* @return

protected static boolean isMappable(SequenceI dnaSeq,

1401

SequenceI proteinSeq, List<AlignedCodonFrame> mappings)

1402

{

1403

if (dnaSeq == null || proteinSeq == null)

{

return false;

}

SequenceI dnaDs = dnaSeq.getDatasetSequence() == null ? dnaSeq

1409

: dnaSeq.getDatasetSequence();

1410

SequenceI proteinDs = proteinSeq.getDatasetSequence() == null

1411

? proteinSeq

1412

: proteinSeq.getDatasetSequence();

1413

1414

for (AlignedCodonFrame mapping : mappings)

1415

{

1416

if (proteinDs == mapping.getAaForDnaSeq(dnaDs))

{

* already mapped

return true;

}

}

* Just try to make a mapping (it is not yet stored), test whether

1427

* successful.

1428

1429

return mapCdnaToProtein(proteinDs, dnaDs) != null;

}

/**

* Finds any reference annotations associated with the sequences in

1434

* sequenceScope, that are not already added to the alignment, and adds them

1435

* to the 'candidates' map. Also populates a lookup table of annotation

1436

* labels, keyed by calcId, for use in constructing tooltips or the like.

1437

1438

* @param sequenceScope

1439

* the sequences to scan for reference annotations

1440

* @param labelForCalcId

1441

* (optional) map to populate with label for calcId

1442

* @param candidates

1443

* map to populate with annotations for sequence

1444

* @param al

1445

* the alignment to check for presence of annotations

1446

1447

public static void findAddableReferenceAnnotations(

1448

List<SequenceI> sequenceScope, Map<String, String> labelForCalcId,

1449

final Map<SequenceI, List<AlignmentAnnotation>> candidates,

1450

AlignmentI al)

1451

{

1452

if (sequenceScope == null)

{

return;

}

* For each sequence in scope, make a list of any annotations on the

1459

* underlying dataset sequence which are not already on the alignment.

1460

1461

* Add to a map of { alignmentSequence, <List of annotations to add> }

1462

1463

for (SequenceI seq : sequenceScope)

1464

{

1465

SequenceI dataset = seq.getDatasetSequence();

if (dataset == null)

{

continue;

}

AlignmentAnnotation[] datasetAnnotations = dataset.getAnnotation();

1471

if (datasetAnnotations == null)

{

continue;

}

final List<AlignmentAnnotation> result = new ArrayList<>();

1476

for (AlignmentAnnotation dsann : datasetAnnotations)

1477

{

1478

1479

* Find matching annotations on the alignment. If none is found, then

1480

* add this annotation to the list of 'addable' annotations for this

1481

* sequence.

1482

1483

155

final Iterable<AlignmentAnnotation> matchedAlignmentAnnotations = al

1484

.findAnnotations(seq, dsann.getCalcId(), dsann.label);

1485

155

boolean found = false;

1486

155

if (matchedAlignmentAnnotations != null)

1487

{

1488

152

for (AlignmentAnnotation matched : matchedAlignmentAnnotations)

1489

{

1490

135

if (dsann.description.equals(matched.description))

{

found = true;

break;

}

}

}

155

if (!found)

1498

{

1499

101

result.add(dsann);

1500

101

if (labelForCalcId != null)

1501

{

1502

labelForCalcId.put(dsann.getCalcId(), dsann.label);

}

}

}

* Save any addable annotations for this sequence

1508

1509

if (!result.isEmpty())

1510

{

1511

candidates.put(seq, result);

}

}

}

/**

* Adds annotations to the top of the alignment annotations, in the same order

1518

* as their related sequences. If you already have an annotation and want to

1519

* add it to a sequence in an alignment use {@code addReferenceAnnotationTo}

1520

1521

* @param annotations

1522

* the annotations to add

1523

* @param alignment

1524

* the alignment to add them to

1525

* @param selectionGroup

1526

* current selection group - may be null, if provided then any added

1527

* annotation will be trimmed to just those columns in the selection

1528

* group

1529

1530

public static void addReferenceAnnotations(

1531

Map<SequenceI, List<AlignmentAnnotation>> annotations,

1532

final AlignmentI alignment, final SequenceGroup selectionGroup)

1533

{

1534

for (SequenceI seq : annotations.keySet())

1535

{

1536

for (AlignmentAnnotation ann : annotations.get(seq))

1537

{

1538

addReferenceAnnotationTo(alignment, seq, ann, selectionGroup);

}

}

}

public static boolean isSSAnnotationPresent(

1544

Map<SequenceI, List<AlignmentAnnotation>> annotations)

1545

{

1546

1547

for (SequenceI seq : annotations.keySet())

1548

{

1549

if (isSecondaryStructurePresent(

1550

annotations.get(seq).toArray(new AlignmentAnnotation[0])))

{

return true;

}

}

return false;

}

/**

* Make a copy of a reference annotation {@code ann} and add it to an

1560

* alignment sequence {@code seq} in {@code alignment}, optionally limited to

1561

* the extent of {@code selectionGroup}

* @param alignment

* @param seq

* @param ann

* @param selectionGroup

1567

* current selection group - may be null, if provided then any added

1568

* annotation will be trimmed to just those columns in the selection

1569

* group

1570

* @return annotation added to {@code seq and {@code alignment}

1571

1572

public static AlignmentAnnotation addReferenceAnnotationTo(

1573

final AlignmentI alignment, final SequenceI seq,

1574

final AlignmentAnnotation ann, final SequenceGroup selectionGroup)

1575

{

1576

AlignmentAnnotation copyAnn = new AlignmentAnnotation(ann);

1577

int startRes = 0;

1578

int endRes = ann.annotations.length;

1579

if (selectionGroup != null)

1580

{

1581

startRes = -1 + Math.min(seq.getEnd(), Math.max(seq.getStart(),

1582

seq.findPosition(selectionGroup.getStartRes())));

1583

endRes = -1 + Math.min(seq.getEnd(),

1584

seq.findPosition(selectionGroup.getEndRes()));

1585

1586

}

1587

copyAnn.restrict(startRes, endRes + 0);

1588

1589

1590

* Add to the sequence (sets copyAnn.datasetSequence), unless the

1591

* original annotation is already on the sequence.

1592

1593

if (!seq.hasAnnotation(ann))

1594

{

1595

ContactMatrixI cm = seq.getDatasetSequence().getContactMatrixFor(ann);

1596

if (cm != null)

1597

{

1598

seq.addContactListFor(copyAnn, cm);

1599

}

1600

seq.addAlignmentAnnotation(copyAnn);

1601

}

1602

// adjust for gaps

1603

copyAnn.adjustForAlignment();

1604

// add to the alignment and set visible

1605

alignment.addAnnotation(copyAnn);

1606

copyAnn.visible = true;

return copyAnn;

}

/**

* Set visibility of alignment annotations of specified types (labels), for

1613

* specified sequences. This supports controls like "Show all secondary

1614

* structure", "Hide all Temp factor", etc.

1615

1616

* @al the alignment to scan for annotations

1617

* @param types

1618

* the types (labels) of annotations to be updated

1619

* @param forSequences

1620

* if not null, only annotations linked to one of these sequences are

1621

* in scope for update; if null, acts on all sequence annotations

1622

* @param anyType

1623

* if this flag is true, 'types' is ignored (label not checked)

1624

* @param doShow

1625

* if true, set visibility on, else set off

1626

1627

public static void showOrHideSequenceAnnotations(AlignmentI al,

1628

Collection<String> types, List<SequenceI> forSequences,

1629

boolean anyType, boolean doShow)

1630

{

1631

AlignmentAnnotation[] anns = al.getAlignmentAnnotation();

1632

if (anns != null)

1633

{

1634

for (AlignmentAnnotation aa : anns)

1635

{

1636

if (anyType || types.contains(aa.label))

1637

{

1638

if ((aa.sequenceRef != null) && (forSequences == null

1639

|| forSequences.contains(aa.sequenceRef)))

{

aa.visible = doShow;

}

}

}

}

}

/**

* Shows or hides auto calculated annotations for a sequence group.

1650

1651

* @param al

1652

* The alignment object with the annotations.

1653

* @param type

1654

* The type of annotation to show or hide.

1655

* @param selectedGroup

1656

* The sequence group for which the annotations should be shown or

1657

* hidden.

1658

* @param anyType

1659

* If true, all types of annotations will be shown/hidden.

1660

* @param doShow

1661

* If true, the annotations will be shown; if false, annotations will

1662

* be hidden.

1663

1664

public static void showOrHideAutoCalculatedAnnotationsForGroup(

1665

AlignmentI al, String type, SequenceGroup selectedGroup,

1666

boolean anyType, boolean doShow)

1667

{

1668

// Get all alignment annotations

1669

AlignmentAnnotation[] anns = al.getAlignmentAnnotation();

if (anns != null)

{

for (AlignmentAnnotation aa : anns)

1674

{

1675

// Check if anyType is true or if the annotation's label contains the

1676

// specified type (currently for secondary structure consensus)

1677

if ((anyType && aa.label

1678

.startsWith(Constants.SECONDARY_STRUCTURE_CONSENSUS_LABEL))

1679

|| aa.label.startsWith(type))

1680

{

1681

// If the annotation's group reference is not null and matches the

1682

// selected group, update its visibility.

1683

if (aa.groupRef != null && selectedGroup == aa.groupRef)

{

aa.visible = doShow;

}

}

}

}

}

public static AlignmentAnnotation getFirstSequenceAnnotationOfType(

1693

AlignmentI al, int graphType)

1694

{

1695

AlignmentAnnotation[] anns = al.getAlignmentAnnotation();

1696

if (anns != null)

1697

{

1698

for (AlignmentAnnotation aa : anns)

1699

{

1700

if (aa.sequenceRef != null && aa.graph == graphType)

return aa;

}

}

return null;

}

/**

* Returns true if either sequence has a cross-reference to the other

* @param seq1

* @param seq2

* @return

public static boolean haveCrossRef(SequenceI seq1, SequenceI seq2)

1715

{

1716

// Note: moved here from class CrossRef as the latter class has dependencies

1717

// not availability to the applet's classpath

1718

return hasCrossRef(seq1, seq2) || hasCrossRef(seq2, seq1);

}

/**

* Returns true if seq1 has a cross-reference to seq2. Currently this assumes

1723

* that sequence name is structured as Source|AccessionId.

* @param seq1

* @param seq2

* @return

108

public static boolean hasCrossRef(SequenceI seq1, SequenceI seq2)

1730

{

1731

108

if (seq1 == null || seq2 == null)

{

return false;

}

100

String name = seq2.getName();

1736

100

final List<DBRefEntry> xrefs = seq1.getDBRefs();

1737

100

if (xrefs != null)

1738

{

1739

for (int ix = 0, nx = xrefs.size(); ix < nx; ix++)

1740

{

1741

DBRefEntry xref = xrefs.get(ix);

1742

String xrefName = xref.getSource() + "|" + xref.getAccessionId();

1743

// case-insensitive test, consistent with DBRefEntry.equalRef()

1744

if (xrefName.equalsIgnoreCase(name))

{

return true;

}

}

}

return false;

}

/**

* Constructs an alignment consisting of the mapped (CDS) regions in the given

1755

* nucleotide sequences, and updates mappings to match. The CDS sequences are

1756

* added to the original alignment's dataset, which is shared by the new

1757

* alignment. Mappings from nucleotide to CDS, and from CDS to protein, are

1758

* added to the alignment dataset.

1759

1760

* @param dna

1761

* aligned nucleotide (dna or cds) sequences

1762

* @param dataset

1763

* the alignment dataset the sequences belong to

1764

* @param products

1765

* (optional) to restrict results to CDS that map to specified

1766

* protein products

1767

* @return an alignment whose sequences are the cds-only parts of the dna

1768

* sequences (or null if no mappings are found)

1769

1770

public static AlignmentI makeCdsAlignment(SequenceI[] dna,

1771

AlignmentI dataset, SequenceI[] products)

1772

{

1773

if (dataset == null || dataset.getDataset() != null)

1774

{

1775

throw new IllegalArgumentException(

1776

"IMPLEMENTATION ERROR: dataset.getDataset() must be null!");

1777

}

1778

List<SequenceI> foundSeqs = new ArrayList<>();

1779

List<SequenceI> cdsSeqs = new ArrayList<>();

1780

List<AlignedCodonFrame> mappings = dataset.getCodonFrames();

1781

HashSet<SequenceI> productSeqs = null;

1782

if (products != null)

1783

{

1784

productSeqs = new HashSet<>();

1785

for (SequenceI seq : products)

1786

{

1787

productSeqs.add(seq.getDatasetSequence() == null ? seq

1788

: seq.getDatasetSequence());

}

}

* Construct CDS sequences from mappings on the alignment dataset.

1794

* The logic is:

1795

* - find the protein product(s) mapped to from each dna sequence

1796

* - if the mapping covers the whole dna sequence (give or take start/stop

1797

* codon), take the dna as the CDS sequence

1798

* - else search dataset mappings for a suitable dna sequence, i.e. one

1799

* whose whole sequence is mapped to the protein

1800

* - if no sequence found, construct one from the dna sequence and mapping

1801

* (and add it to dataset so it is found if this is repeated)

1802

1803

for (SequenceI dnaSeq : dna)

1804

{

1805

SequenceI dnaDss = dnaSeq.getDatasetSequence() == null ? dnaSeq

1806

: dnaSeq.getDatasetSequence();

1807

1808

List<AlignedCodonFrame> seqMappings = MappingUtils

1809

.findMappingsForSequence(dnaSeq, mappings);

1810

for (AlignedCodonFrame mapping : seqMappings)

1811

{

1812

List<Mapping> mappingsFromSequence = mapping

1813

.getMappingsFromSequence(dnaSeq);

1814

1815

for (Mapping aMapping : mappingsFromSequence)

1816

{

1817

MapList mapList = aMapping.getMap();

1818

if (mapList.getFromRatio() == 1)

1819

{

1820

1821

* not a dna-to-protein mapping (likely dna-to-cds)

continue;

}

* skip if mapping is not to one of the target set of proteins

1828

1829

SequenceI proteinProduct = aMapping.getTo();

1830

if (productSeqs != null && !productSeqs.contains(proteinProduct))

{

continue;

}

* try to locate the CDS from the dataset mappings;

1837

* guard against duplicate results (for the case that protein has

1838

* dbrefs to both dna and cds sequences)

1839

1840

SequenceI cdsSeq = findCdsForProtein(mappings, dnaSeq,

1841

seqMappings, aMapping);

1842

if (cdsSeq != null)

1843

{

1844

if (!foundSeqs.contains(cdsSeq))

1845

{

1846

foundSeqs.add(cdsSeq);

1847

SequenceI derivedSequence = cdsSeq.deriveSequence();

1848

cdsSeqs.add(derivedSequence);

1849

if (!dataset.getSequences().contains(cdsSeq))

1850

{

1851

dataset.addSequence(cdsSeq);

}

}

continue;

}

* didn't find mapped CDS sequence - construct it and add

1859

* its dataset sequence to the dataset

1860

1861

cdsSeq = makeCdsSequence(dnaSeq.getDatasetSequence(), aMapping,

1862

dataset).deriveSequence();

1863

// cdsSeq has a name constructed as CDS|<dbref>

1864

// <dbref> will be either the accession for the coding sequence,

1865

// marked in the /via/ dbref to the protein product accession

1866

// or it will be the original nucleotide accession.

1867

SequenceI cdsSeqDss = cdsSeq.getDatasetSequence();

cdsSeqs.add(cdsSeq);

* build the mapping from CDS to protein

1873

1874

List<int[]> cdsRange = Collections

1875

.singletonList(new int[]

1876

{ cdsSeq.getStart(),

1877

cdsSeq.getLength() + cdsSeq.getStart() - 1 });

1878

MapList cdsToProteinMap = new MapList(cdsRange,

1879

mapList.getToRanges(), mapList.getFromRatio(),

1880

mapList.getToRatio());

1881

1882

if (!dataset.getSequences().contains(cdsSeqDss))

1883

{

1884

1885

* if this sequence is a newly created one, add it to the dataset

1886

* and made a CDS to protein mapping (if sequence already exists,

1887

* CDS-to-protein mapping _is_ the transcript-to-protein mapping)

1888

1889

dataset.addSequence(cdsSeqDss);

1890

AlignedCodonFrame cdsToProteinMapping = new AlignedCodonFrame();

1891

cdsToProteinMapping.addMap(cdsSeqDss, proteinProduct,

cdsToProteinMap);

* guard against duplicating the mapping if repeating this action

1896

1897

if (!mappings.contains(cdsToProteinMapping))

1898

{

1899

mappings.add(cdsToProteinMapping);

}

}

propagateDBRefsToCDS(cdsSeqDss, dnaSeq.getDatasetSequence(),

1904

proteinProduct, aMapping);

1905

1906

* add another mapping from original 'from' range to CDS

1907

1908

AlignedCodonFrame dnaToCdsMapping = new AlignedCodonFrame();

1909

final MapList dnaToCdsMap = new MapList(mapList.getFromRanges(),

1910

cdsRange, 1, 1);

1911

dnaToCdsMapping.addMap(dnaSeq.getDatasetSequence(), cdsSeqDss,

1912

dnaToCdsMap);

1913

if (!mappings.contains(dnaToCdsMapping))

1914

{

1915

mappings.add(dnaToCdsMapping);

}

* transfer dna chromosomal loci (if known) to the CDS

1920

* sequence (via the mapping)

1921

1922

final MapList cdsToDnaMap = dnaToCdsMap.getInverse();

1923

transferGeneLoci(dnaSeq, cdsToDnaMap, cdsSeq);

1924

1925

1926

* add DBRef with mapping from protein to CDS

1927

* (this enables Get Cross-References from protein alignment)

1928

* This is tricky because we can't have two DBRefs with the

1929

* same source and accession, so need a different accession for

1930

* the CDS from the dna sequence

1931

1932

1933

// specific use case:

1934

// Genomic contig ENSCHR:1, contains coding regions for ENSG01,

1935

// ENSG02, ENSG03, with transcripts and products similarly named.

1936

// cannot add distinct dbrefs mapping location on ENSCHR:1 to ENSG01

1937

1938

// JBPNote: ?? can't actually create an example that demonstrates we

1939

// need to

1940

// synthesize an xref.

1941

1942

List<DBRefEntry> primrefs = dnaDss.getPrimaryDBRefs();

1943

for (int ip = 0, np = primrefs.size(); ip < np; ip++)

1944

{

1945

DBRefEntry primRef = primrefs.get(ip);

1946

1947

* create a cross-reference from CDS to the source sequence's

1948

* primary reference and vice versa

1949

1950

String source = primRef.getSource();

1951

String version = primRef.getVersion();

1952

DBRefEntry cdsCrossRef = new DBRefEntry(source,

1953

source + ":" + version, primRef.getAccessionId());

1954

cdsCrossRef

1955

.setMap(new Mapping(dnaDss, new MapList(cdsToDnaMap)));

1956

cdsSeqDss.addDBRef(cdsCrossRef);

1957

1958

dnaSeq.addDBRef(new DBRefEntry(source, version,

1959

cdsSeq.getName(), new Mapping(cdsSeqDss, dnaToCdsMap)));

1960

// problem here is that the cross-reference is synthesized -

1961

// cdsSeq.getName() may be like 'CDS|dnaaccession' or

1962

// 'CDS|emblcdsacc'

1963

// assuming cds version same as dna ?!?

1964

1965

DBRefEntry proteinToCdsRef = new DBRefEntry(source, version,

1966

cdsSeq.getName());

1967

1968

proteinToCdsRef.setMap(

1969

new Mapping(cdsSeqDss, cdsToProteinMap.getInverse()));

1970

proteinProduct.addDBRef(proteinToCdsRef);

1971

}

1972

1973

* transfer any features on dna that overlap the CDS

1974

1975

transferFeatures(dnaSeq, cdsSeq, dnaToCdsMap, null,

1976

SequenceOntologyI.CDS);

}

}

}

AlignmentI cds = new Alignment(

1982

cdsSeqs.toArray(new SequenceI[cdsSeqs.size()]));

1983

cds.setDataset(dataset);

return cds;

}

/**

* Tries to transfer gene loci (dbref to chromosome positions) from fromSeq to

1990

* toSeq, mediated by the given mapping between the sequences

1991

1992

* @param fromSeq

1993

* @param targetToFrom

* Map

* @param targetSeq

protected static void transferGeneLoci(SequenceI fromSeq,

1998

MapList targetToFrom, SequenceI targetSeq)

1999

{

2000

if (targetSeq.getGeneLoci() != null)

2001

{

2002

// already have - don't override

2003

return;

2004

}

2005

GeneLociI fromLoci = fromSeq.getGeneLoci();

2006

if (fromLoci == null)

{

return;

}

MapList newMap = targetToFrom.traverse(fromLoci.getMapping());

if (newMap != null)

{

targetSeq.setGeneLoci(fromLoci.getSpeciesId(),

2016

fromLoci.getAssemblyId(), fromLoci.getChromosomeId(), newMap);

}

}

/**

* A helper method that finds a CDS sequence in the alignment dataset that is

2022

* mapped to the given protein sequence, and either is, or has a mapping from,

2023

* the given dna sequence.

2024

2025

* @param mappings

2026

* set of all mappings on the dataset

2027

* @param dnaSeq

2028

* a dna (or cds) sequence we are searching from

2029

* @param seqMappings

2030

* the set of mappings involving dnaSeq

2031

* @param aMapping

2032

* a transcript-to-peptide mapping

2033

* @return

2034

2035

static SequenceI findCdsForProtein(List<AlignedCodonFrame> mappings,

2036

SequenceI dnaSeq, List<AlignedCodonFrame> seqMappings,

Mapping aMapping)

{

* TODO a better dna-cds-protein mapping data representation to allow easy

2041

* navigation; until then this clunky looping around lists of mappings

2042

2043

SequenceI seqDss = dnaSeq.getDatasetSequence() == null ? dnaSeq

2044

: dnaSeq.getDatasetSequence();

2045

SequenceI proteinProduct = aMapping.getTo();

2046

2047

2048

* is this mapping from the whole dna sequence (i.e. CDS)?

2049

* allowing for possible stop codon on dna but not peptide

2050

2051

int mappedFromLength = MappingUtils

2052

.getLength(aMapping.getMap().getFromRanges());

2053

int dnaLength = seqDss.getLength();

2054

if (mappedFromLength == dnaLength

2055

|| mappedFromLength == dnaLength - CODON_LENGTH)

2056

{

2057

2058

* if sequence has CDS features, this is a transcript with no UTR

2059

* - do not take this as the CDS sequence! (JAL-2789)

2060

2061

if (seqDss.getFeatures().getFeaturesByOntology(SequenceOntologyI.CDS)

.isEmpty())

{

return seqDss;

}

}

* looks like we found the dna-to-protein mapping; search for the

2070

* corresponding cds-to-protein mapping

2071

2072

List<AlignedCodonFrame> mappingsToPeptide = MappingUtils

2073

.findMappingsForSequence(proteinProduct, mappings);

2074

for (AlignedCodonFrame acf : mappingsToPeptide)

2075

{

2076

for (SequenceToSequenceMapping map : acf.getMappings())

2077

{

2078

276

Mapping mapping = map.getMapping();

2079

276

if (mapping != aMapping

2080

&& mapping.getMap().getFromRatio() == CODON_LENGTH

2081

&& proteinProduct == mapping.getTo()

2082

&& seqDss != map.getFromSeq())

2083

{

2084

mappedFromLength = MappingUtils

2085

.getLength(mapping.getMap().getFromRanges());

2086

if (mappedFromLength == map.getFromSeq().getLength())

2087

{

2088

2089

* found a 3:1 mapping to the protein product which covers

2090

* the whole dna sequence i.e. is from CDS; finally check the CDS

2091

* is mapped from the given dna start sequence

2092

2093

SequenceI cdsSeq = map.getFromSeq();

2094

// todo this test is weak if seqMappings contains multiple mappings;

2095

// we get away with it if transcript:cds relationship is 1:1

2096

List<AlignedCodonFrame> dnaToCdsMaps = MappingUtils

2097

.findMappingsForSequence(cdsSeq, seqMappings);

2098

if (!dnaToCdsMaps.isEmpty())

{

return cdsSeq;

}

}

}

}

}

return null;

}

/**

* Helper method that makes a CDS sequence as defined by the mappings from the

2111

* given sequence i.e. extracts the 'mapped from' ranges (which may be on

2112

* forward or reverse strand).

* @param seq

* @param mapping

* @param dataset

* - existing dataset. We check for sequences that look like the CDS

2118

* we are about to construct, if one exists already, then we will

2119

* just return that one.

2120

* @return CDS sequence (as a dataset sequence)

2121

2122

static SequenceI makeCdsSequence(SequenceI seq, Mapping mapping,

AlignmentI dataset)

{

* construct CDS sequence name as "CDS|" with 'from id' held in the mapping

2127

* if set (e.g. EMBL protein_id), else sequence name appended

2128

2129

String mapFromId = mapping.getMappedFromId();

2130

final String seqId = "CDS|"

2131

+ (mapFromId != null ? mapFromId : seq.getName());

2132

2133

SequenceI newSeq = null;

2134

2135

2136

* construct CDS sequence by splicing mapped from ranges

2137

2138

char[] seqChars = seq.getSequence();

2139

List<int[]> fromRanges = mapping.getMap().getFromRanges();

2140

int cdsWidth = MappingUtils.getLength(fromRanges);

2141

char[] newSeqChars = new char[cdsWidth];

2142

2143

int newPos = 0;

2144

for (int[] range : fromRanges)

2145

{

2146

if (range[0] <= range[1])

2147

{

2148

// forward strand mapping - just copy the range

2149

int length = range[1] - range[0] + 1;

2150

System.arraycopy(seqChars, range[0] - 1, newSeqChars, newPos,

length);

newPos += length;

}

else

{

// reverse strand mapping - copy and complement one by one

2157

for (int i = range[0]; i >= range[1]; i--)

2158

{

2159

newSeqChars[newPos++] = Dna.getComplement(seqChars[i - 1]);

}

}

newSeq = new Sequence(seqId, newSeqChars, 1, newPos);

}

if (dataset != null)

{

SequenceI[] matches = dataset.findSequenceMatch(newSeq.getName());

2169

if (matches != null)

2170

{

2171

boolean matched = false;

2172

for (SequenceI mtch : matches)

2173

{

2174

if (mtch.getStart() != newSeq.getStart())

{

continue;

}

if (mtch.getEnd() != newSeq.getEnd())

{

continue;

}

if (!Arrays.equals(mtch.getSequence(), newSeq.getSequence()))

{

continue;

}

if (!matched)

{

matched = true;

newSeq = mtch;

}

else

{

Console.error(

"JAL-2154 regression: warning - found (and ignored) a duplicate CDS sequence:"

+ mtch.toString());

}

}

}

}

// newSeq.setDescription(mapFromId);

return newSeq;

}

/**

* Adds any DBRefEntrys to cdsSeq from contig that have a Mapping congruent to

* the given mapping.

* @param cdsSeq

* @param contig

* @param proteinProduct

2212

* @param mapping

2213

* @return list of DBRefEntrys added

2214

2215

protected static List<DBRefEntry> propagateDBRefsToCDS(SequenceI cdsSeq,

2216

SequenceI contig, SequenceI proteinProduct, Mapping mapping)

2217

{

2218

2219

// gather direct refs from contig congruent with mapping

2220

List<DBRefEntry> direct = new ArrayList<>();

2221

HashSet<String> directSources = new HashSet<>();

2222

2223

List<DBRefEntry> refs = contig.getDBRefs();

2224

if (refs != null)

2225

{

2226

292

for (int ib = 0, nb = refs.size(); ib < nb; ib++)

2227

{

2228

279

DBRefEntry dbr = refs.get(ib);

2229

279

MapList map;

2230

if (dbr.hasMap() && (map = dbr.getMap().getMap()).isTripletMap())

2231

{

2232

// check if map is the CDS mapping

2233

if (mapping.getMap().equals(map))

2234

{

2235

direct.add(dbr);

2236

directSources.add(dbr.getSource());

}

}

}

}

List<DBRefEntry> onSource = DBRefUtils.selectRefs(

2242

proteinProduct.getDBRefs(),

2243

directSources.toArray(new String[0]));

2244

List<DBRefEntry> propagated = new ArrayList<>();

2245

2246

// and generate appropriate mappings

2247

for (int ic = 0, nc = direct.size(); ic < nc; ic++)

2248

{

2249

DBRefEntry cdsref = direct.get(ic);

2250

Mapping m = cdsref.getMap();

2251

// clone maplist and mapping

2252

MapList cdsposmap = new MapList(

2253

Arrays.asList(new int[][]

2254

{ new int[] { cdsSeq.getStart(), cdsSeq.getEnd() } }),

2255

m.getMap().getToRanges(), 3, 1);

2256

Mapping cdsmap = new Mapping(m.getTo(), m.getMap());

2257

2258

// create dbref

2259

DBRefEntry newref = new DBRefEntry(cdsref.getSource(),

2260

cdsref.getVersion(), cdsref.getAccessionId(),

2261

new Mapping(cdsmap.getTo(), cdsposmap));

2262

2263

// and see if we can map to the protein product for this mapping.

2264

// onSource is the filtered set of accessions on protein that we are

2265

// tranferring, so we assume accession is the same.

2266

if (cdsmap.getTo() == null && onSource != null)

2267

{

2268

List<DBRefEntry> sourceRefs = DBRefUtils.searchRefs(onSource,

2269

cdsref.getAccessionId());

2270

if (sourceRefs != null)

2271

{

2272

for (DBRefEntry srcref : sourceRefs)

2273

{

2274

if (srcref.getSource().equalsIgnoreCase(cdsref.getSource()))

2275

{

2276

// we have found a complementary dbref on the protein product, so

2277

// update mapping's getTo

2278

newref.getMap().setTo(proteinProduct);

}

}

}

}

cdsSeq.addDBRef(newref);

2284

propagated.add(newref);

}

return propagated;

}

/**

* Transfers co-located features on 'fromSeq' to 'toSeq', adjusting the

2291

* feature start/end ranges, optionally omitting specified feature types.

2292

* Returns the number of features copied.

* @param fromSeq

* @param toSeq

* @param mapping

* the mapping from 'fromSeq' to 'toSeq'

2298

* @param select

2299

* if not null, only features of this type are copied (including

2300

* subtypes in the Sequence Ontology)

2301

* @param omitting

2302

2303

protected static int transferFeatures(SequenceI fromSeq, SequenceI toSeq,

2304

MapList mapping, String select, String... omitting)

2305

{

2306

SequenceI copyTo = toSeq;

2307

while (copyTo.getDatasetSequence() != null)

2308

{

2309

copyTo = copyTo.getDatasetSequence();

2310

}

2311

if (fromSeq == copyTo || fromSeq.getDatasetSequence() == copyTo)

2312

{

2313

return 0; // shared dataset sequence

}

* get features, optionally restricted by an ontology term

2318

2319

List<SequenceFeature> sfs = select == null

2320

? fromSeq.getFeatures().getPositionalFeatures()

2321

: fromSeq.getFeatures().getFeaturesByOntology(select);

2322

2323

int count = 0;

2324

for (SequenceFeature sf : sfs)

2325

{

2326

9610

String type = sf.getType();

2327

9610

boolean omit = false;

2328

9610

for (String toOmit : omitting)

2329

{

2330

9603

if (type.equals(toOmit))

2331

{

2332

134

omit = true;

2333

}

2334

}

2335

9610

if (omit)

2336

{

2337

134

continue;

}

* locate the mapped range - null if either start or end is

2342

* not mapped (no partial overlaps are calculated)

2343

2344

9476

int start = sf.getBegin();

2345

9476

int end = sf.getEnd();

2346

9476

int[] mappedTo = mapping.locateInTo(start, end);

2347

2348

* if whole exon range doesn't map, try interpreting it

2349

* as 5' or 3' exon overlapping the CDS range

2350

2351

9476

if (mappedTo == null)

2352

{

2353

4447

mappedTo = mapping.locateInTo(end, end);

2354

4447

if (mappedTo != null)

2355

{

2356

2357

* end of exon is in CDS range - 5' overlap

2358

* to a range from the start of the peptide

mappedTo[0] = 1;

}

}

9476

if (mappedTo == null)

2364

{

2365

4447

mappedTo = mapping.locateInTo(start, start);

2366

4447

if (mappedTo != null)

2367

{

2368

2369

* start of exon is in CDS range - 3' overlap

2370

* to a range up to the end of the peptide

2371

2372

mappedTo[1] = toSeq.getLength();

2373

}

2374

}

2375

9476

if (mappedTo != null)

2376

{

2377

5029

int newBegin = Math.min(mappedTo[0], mappedTo[1]);

2378

5029

int newEnd = Math.max(mappedTo[0], mappedTo[1]);

2379

5029

SequenceFeature copy = new SequenceFeature(sf, newBegin, newEnd,

2380

sf.getFeatureGroup(), sf.getScore());

2381

5029

copyTo.addSequenceFeature(copy);

2382

5029

count++;

}

}

return count;

}

/**

* Returns a mapping from dna to protein by inspecting sequence features of

2390

* type "CDS" on the dna. A mapping is constructed if the total CDS feature

2391

* length is 3 times the peptide length (optionally after dropping a trailing

2392

* stop codon). This method does not check whether the CDS nucleotide sequence

2393

* translates to the peptide sequence.

* @param dnaSeq

* @param proteinSeq

* @return

public static MapList mapCdsToProtein(SequenceI dnaSeq,

2400

SequenceI proteinSeq)

2401

{

2402

List<int[]> ranges = findCdsPositions(dnaSeq);

2403

int mappedDnaLength = MappingUtils.getLength(ranges);

2404

2405

2406

* if not a whole number of codons, truncate mapping

2407

2408

int codonRemainder = mappedDnaLength % CODON_LENGTH;

2409

if (codonRemainder > 0)

2410

{

2411

mappedDnaLength -= codonRemainder;

2412

MappingUtils.removeEndPositions(codonRemainder, ranges);

2413

}

2414

2415

int proteinLength = proteinSeq.getLength();

2416

int proteinStart = proteinSeq.getStart();

2417

int proteinEnd = proteinSeq.getEnd();

2418

2419

2420

* incomplete start codon may mean X at start of peptide

2421

* we ignore both for mapping purposes

2422

2423

if (proteinSeq.getCharAt(0) == 'X')

2424

{

2425

// todo JAL-2022 support startPhase > 0

proteinStart++;

proteinLength--;

}

List<int[]> proteinRange = new ArrayList<>();

2430

2431

2432

* dna length should map to protein (or protein plus stop codon)

2433

2434

int codesForResidues = mappedDnaLength / CODON_LENGTH;

2435

if (codesForResidues == (proteinLength + 1))

2436

{

2437

// assuming extra codon is for STOP and not in peptide

2438

// todo: check trailing codon is indeed a STOP codon

2439

codesForResidues--;

2440

mappedDnaLength -= CODON_LENGTH;

2441

MappingUtils.removeEndPositions(CODON_LENGTH, ranges);

2442

}

2443

2444

if (codesForResidues == proteinLength)

2445

{

2446

proteinRange.add(new int[] { proteinStart, proteinEnd });

2447

return new MapList(ranges, proteinRange, CODON_LENGTH, 1);

}

return null;

}

/**

* Returns a list of CDS ranges found (as sequence positions base 1), i.e. of

2454

* [start, end] positions of sequence features of type "CDS" (or a sub-type of

2455

* CDS in the Sequence Ontology). The ranges are sorted into ascending start

2456

* position order, so this method is only valid for linear CDS in the same

2457

* sense as the protein product.

* @param dnaSeq

* @return

protected static List<int[]> findCdsPositions(SequenceI dnaSeq)

2463

{

2464

List<int[]> result = new ArrayList<>();

2465

2466

List<SequenceFeature> sfs = dnaSeq.getFeatures()

2467

.getFeaturesByOntology(SequenceOntologyI.CDS);

if (sfs.isEmpty())

{

return result;

}

SequenceFeatures.sortFeatures(sfs, true);

2473

2474

for (SequenceFeature sf : sfs)

{

int phase = 0;

try

{

String s = sf.getPhase();

2480

if (s != null)

2481

{

2482

phase = Integer.parseInt(s);

2483

}

2484

} catch (NumberFormatException e)

{

// leave as zero

}

* phase > 0 on first codon means 5' incomplete - skip to the start

2490

* of the next codon; example ENST00000496384

2491

2492

int begin = sf.getBegin();

2493

int end = sf.getEnd();

2494

if (result.isEmpty() && phase > 0)

{

begin += phase;

if (begin > end)

{

// shouldn't happen!

System.err

.println("Error: start phase extends beyond start CDS in "

+ dnaSeq.getName());

}

}

result.add(new int[] { begin, end });

}

* Finally sort ranges by start position. This avoids a dependency on

2510

* keeping features in order on the sequence (if they are in order anyway,

2511

* the sort will have almost no work to do). The implicit assumption is CDS

2512

* ranges are assembled in order. Other cases should not use this method,

2513

* but instead construct an explicit mapping for CDS (e.g. EMBL parsing).

2514

2515

Collections.sort(result, IntRangeComparator.ASCENDING);

return result;

}

/**

* Makes an alignment with a copy of the given sequences, adding in any

2521

* non-redundant sequences which are mapped to by the cross-referenced

* sequences.

* @param seqs

* @param xrefs

* @param dataset

* the alignment dataset shared by the new copy

2528

* @return

2529

2530

public static AlignmentI makeCopyAlignment(SequenceI[] seqs,

2531

SequenceI[] xrefs, AlignmentI dataset)

2532

{

2533

AlignmentI copy = new Alignment(new Alignment(seqs));

2534

copy.setDataset(dataset);

2535

boolean isProtein = !copy.isNucleotide();

2536

SequenceIdMatcher matcher = new SequenceIdMatcher(seqs);

2537

if (xrefs != null)

2538

{

2539

// BH 2019.01.25 recoded to remove iterators

2540

2541

for (int ix = 0, nx = xrefs.length; ix < nx; ix++)

2542

{

2543

SequenceI xref = xrefs[ix];

2544

List<DBRefEntry> dbrefs = xref.getDBRefs();

2545

if (dbrefs != null)

2546

{

2547

for (int ir = 0, nir = dbrefs.size(); ir < nir; ir++)

2548

{

2549

DBRefEntry dbref = dbrefs.get(ir);

2550

Mapping map = dbref.getMap();

2551

SequenceI mto;

2552

if (map == null || (mto = map.getTo()) == null

2553

|| mto.isProtein() != isProtein)

{

continue;

}

SequenceI mappedTo = mto;

2558

SequenceI match = matcher.findIdMatch(mappedTo);

2559

if (match == null)

2560

{

2561

matcher.add(mappedTo);

2562

copy.addSequence(mappedTo);

}

}

}

}

}

return copy;

}

/**

* Try to align sequences in 'unaligned' to match the alignment of their

2573

* mapped regions in 'aligned'. For example, could use this to align CDS

2574

* sequences which are mapped to their parent cDNA sequences.

2575

2576

* This method handles 1:1 mappings (dna-to-dna or protein-to-protein). For

2577

* dna-to-protein or protein-to-dna use alternative methods.

2578

2579

* @param unaligned

2580

* sequences to be aligned

2581

* @param aligned

2582

* holds aligned sequences and their mappings

2583

* @return

2584

2585

public static int alignAs(AlignmentI unaligned, AlignmentI aligned)

2586

{

2587

2588

* easy case - aligning a copy of aligned sequences

2589

2590

if (alignAsSameSequences(unaligned, aligned))

2591

{

2592

return unaligned.getHeight();

}

* fancy case - aligning via mappings between sequences

2597

2598

List<SequenceI> unmapped = new ArrayList<>();

2599

Map<Integer, Map<SequenceI, Character>> columnMap = buildMappedColumnsMap(

2600

unaligned, aligned, unmapped);

2601

int width = columnMap.size();

2602

char gap = unaligned.getGapCharacter();

2603

int realignedCount = 0;

2604

// TODO: verify this loop scales sensibly for very wide/high alignments

2605

2606

for (SequenceI seq : unaligned.getSequences())

2607

{

2608

if (!unmapped.contains(seq))

2609

{

2610

char[] newSeq = new char[width];

2611

Arrays.fill(newSeq, gap); // JBPComment - doubt this is faster than the

2612

// Integer iteration below

int newCol = 0;

int lastCol = 0;

* traverse the map to find columns populated

2618

* by our sequence

2619

2620

for (Integer column : columnMap.keySet())

2621

{

2622

58976

Character c = columnMap.get(column).get(seq);

2623

58976

if (c != null)

2624

{

2625

2626

* sequence has a character at this position

2627

2628

2629

31986

newSeq[newCol] = c;

2630

31986

lastCol = newCol;

2631

}

2632

58976

newCol++;

}

* trim trailing gaps

if (lastCol < width)

{

char[] tmp = new char[lastCol + 1];

2641

System.arraycopy(newSeq, 0, tmp, 0, lastCol + 1);

2642

newSeq = tmp;

2643

}

2644

// TODO: optimise SequenceI to avoid char[]->String->char[]

2645

seq.setSequence(String.valueOf(newSeq));

realignedCount++;

}

}

return realignedCount;

}

/**

* If unaligned and aligned sequences share the same dataset sequences, then

2654

* simply copies the aligned sequences to the unaligned sequences and returns

2655

* true; else returns false

2656

2657

* @param unaligned

2658

* - sequences to be aligned based on aligned

2659

* @param aligned

2660

* - 'guide' alignment containing sequences derived from same dataset

* as unaligned

* @return

static boolean alignAsSameSequences(AlignmentI unaligned,

2665

AlignmentI aligned)

2666

{

2667

if (aligned.getDataset() == null || unaligned.getDataset() == null)

2668

{

2669

return false; // should only pass alignments with datasets here

2670

}

2671

2672

// map from dataset sequence to alignment sequence(s)

2673

Map<SequenceI, List<SequenceI>> alignedDatasets = new HashMap<>();

2674

for (SequenceI seq : aligned.getSequences())

2675

{

2676

SequenceI ds = seq.getDatasetSequence();

2677

if (alignedDatasets.get(ds) == null)

2678

{

2679

alignedDatasets.put(ds, new ArrayList<SequenceI>());

2680

}

2681

alignedDatasets.get(ds).add(seq);

}

* first pass - check whether all sequences to be aligned share a

2686

* dataset sequence with an aligned sequence; also note the leftmost

2687

* ungapped column from which to copy

2688

2689

int leftmost = Integer.MAX_VALUE;

2690

for (SequenceI seq : unaligned.getSequences())

2691

{

2692

final SequenceI ds = seq.getDatasetSequence();

2693

if (!alignedDatasets.containsKey(ds))

{

return false;

}

SequenceI alignedSeq = alignedDatasets.get(ds).get(0);

2698

int startCol = alignedSeq.findIndex(seq.getStart()); // 1..

2699

leftmost = Math.min(leftmost, startCol);

}

* second pass - copy aligned sequences;

2704

* heuristic rule: pair off sequences in order for the case where

2705

* more than one shares the same dataset sequence

2706

2707

final char gapCharacter = aligned.getGapCharacter();

2708

for (SequenceI seq : unaligned.getSequences())

2709

{

2710

List<SequenceI> alignedSequences = alignedDatasets

2711

.get(seq.getDatasetSequence());

2712

if (alignedSequences.isEmpty())

2713

{

2714

2715

* defensive check - shouldn't happen! (JAL-3536)

continue;

}

SequenceI alignedSeq = alignedSequences.get(0);

2720

2721

2722

* gap fill for leading (5') UTR if any

2723

2724

// TODO this copies intron columns - wrong!

2725

int startCol = alignedSeq.findIndex(seq.getStart()); // 1..

2726

int endCol = alignedSeq.findIndex(seq.getEnd());

2727

char[] seqchars = new char[endCol - leftmost + 1];

2728

Arrays.fill(seqchars, gapCharacter);

2729

char[] toCopy = alignedSeq.getSequence(startCol - 1, endCol);

2730

System.arraycopy(toCopy, 0, seqchars, startCol - leftmost,

2731

toCopy.length);

2732

seq.setSequence(String.valueOf(seqchars));

2733

if (alignedSequences.size() > 0)

2734

{

2735

// pop off aligned sequences (except the last one)

2736

alignedSequences.remove(0);

}

}

* finally remove gapped columns (e.g. introns)

2742

2743

new RemoveGapColCommand("", unaligned.getSequencesArray(), 0,

2744

unaligned.getWidth() - 1, unaligned);

return true;

}

/**

* Returns a map whose key is alignment column number (base 1), and whose

2751

* values are a map of sequence characters in that column.

* @param unaligned

* @param aligned

* @param unmapped

* @return

static SortedMap<Integer, Map<SequenceI, Character>> buildMappedColumnsMap(

2759

AlignmentI unaligned, AlignmentI aligned,

2760

List<SequenceI> unmapped)

2761

{

2762

2763

* Map will hold, for each aligned column position, a map of

2764

* {unalignedSequence, characterPerSequence} at that position.

2765

* TreeMap keeps the entries in ascending column order.

2766

2767

SortedMap<Integer, Map<SequenceI, Character>> map = new TreeMap<>();

2768

2769

2770

* record any sequences that have no mapping so can't be realigned

2771

2772

unmapped.addAll(unaligned.getSequences());

2773

2774

List<AlignedCodonFrame> mappings = aligned.getCodonFrames();

2775

2776

for (SequenceI seq : unaligned.getSequences())

2777

{

2778

for (AlignedCodonFrame mapping : mappings)

2779

{

2780

510

SequenceI fromSeq = mapping.findAlignedSequence(seq, aligned);

2781

510

if (fromSeq != null)

2782

{

2783

Mapping seqMap = mapping.getMappingBetween(fromSeq, seq);

2784

if (addMappedPositions(seq, fromSeq, seqMap, map))

2785

{

2786

unmapped.remove(seq);

}

}

}

}

return map;

}

/**

* Helper method that adds to a map the mapped column positions of a sequence.

2796

* <br>

2797

* For example if aaTT-Tg-gAAA is mapped to TTTAAA then the map should record

2798

* that columns 3,4,6,10,11,12 map to characters T,T,T,A,A,A of the mapped to

* sequence.

* @param seq

* the sequence whose column positions we are recording

2803

* @param fromSeq

2804

* a sequence that is mapped to the first sequence

2805

* @param seqMap

2806

* the mapping from 'fromSeq' to 'seq'

2807

* @param map

2808

* a map to add the column positions (in fromSeq) of the mapped

* positions of seq

* @return

static boolean addMappedPositions(SequenceI seq, SequenceI fromSeq,

2813

Mapping seqMap, Map<Integer, Map<SequenceI, Character>> map)

{

if (seqMap == null)

{

return false;

}

* invert mapping if it is from unaligned to aligned sequence

2822

2823

if (seqMap.getTo() == fromSeq.getDatasetSequence())

2824

{

2825

seqMap = new Mapping(seq.getDatasetSequence(),

2826

seqMap.getMap().getInverse());

2827

}

2828

2829

int toStart = seq.getStart();

2830

2831

2832

* traverse [start, end, start, end...] ranges in fromSeq

2833

2834

for (int[] fromRange : seqMap.getMap().getFromRanges())

2835

{

2836

for (int i = 0; i < fromRange.length - 1; i += 2)

2837

{

2838

boolean forward = fromRange[i + 1] >= fromRange[i];

2839

2840

2841

* find the range mapped to (sequence positions base 1)

2842

2843

int[] range = seqMap.locateMappedRange(fromRange[i],

fromRange[i + 1]);

if (range == null)

{

jalview.bin.Console.errPrintln("Error in mapping " + seqMap

2848

+ " from " + fromSeq.getName());

2849

return false;

2850

}

2851

int fromCol = fromSeq.findIndex(fromRange[i]);

2852

int mappedCharPos = range[0];

2853

2854

2855

* walk over the 'from' aligned sequence in forward or reverse

2856

* direction; when a non-gap is found, record the column position

2857

* of the next character of the mapped-to sequence; stop when all

2858

* the characters of the range have been counted

2859

2860

2794274

while (mappedCharPos <= range[1] && fromCol <= fromSeq.getLength()

2861

&& fromCol >= 0)

2862

{

2863

2794243

if (!Comparison.isGap(fromSeq.getCharAt(fromCol - 1)))

2864

{

2865

2866

* mapped from sequence has a character in this column

2867

* record the column position for the mapped to character

2868

2869

31998

Map<SequenceI, Character> seqsMap = map.get(fromCol);

2870

31998

if (seqsMap == null)

2871

{

2872

5398

seqsMap = new HashMap<>();

2873

5398

map.put(fromCol, seqsMap);

2874

}

2875

31998

seqsMap.put(seq, seq.getCharAt(mappedCharPos - toStart));

2876

31998

mappedCharPos++;

2877

}

2878

2794243

fromCol += (forward ? 1 : -1);

}

}

}

return true;

}

// strictly temporary hack until proper criteria for aligning protein to cds

2886

// are in place; this is so Ensembl -> fetch xrefs Uniprot aligns the Uniprot

2887

public static boolean looksLikeEnsembl(AlignmentI alignment)

2888

{

2889

for (SequenceI seq : alignment.getSequences())

2890

{

2891

String name = seq.getName();

2892

if (!name.startsWith("ENSG") && !name.startsWith("ENST"))

{

return false;

}

}

return true;

}

public static boolean isSecondaryStructurePresent(

2901

AlignmentAnnotation[] annotations)

2902

{

2903

boolean ssPresent = false;

2904

2905

for (AlignmentAnnotation aa : annotations)

{

if (ssPresent)

{

break;

}

if (Constants.SECONDARY_STRUCTURE_LABELS.containsKey(aa.label))

{

ssPresent = true;

break;

}

}

return ssPresent;

}

public static Color getSecondaryStructureAnnotationColour(char symbol)

2924

{

2925

2926

if (symbol == Constants.COIL)

{

return Color.gray;

}

if (symbol == Constants.SHEET)

{

return Color.green;

}

if (symbol == Constants.HELIX)

{

return Color.red;

}

return Color.white;

}

70406

public static char findSSAnnotationForGivenSeqposition(

2943

AlignmentAnnotation aa, int seqPosition)

2944

{

2945

70406

char ss = '*';

2946

2947

70406

if (aa != null)

2948

{

2949

70406

if (aa.getAnnotationForPosition(seqPosition) != null)

2950

{

2951

41428

Annotation a = aa.getAnnotationForPosition(seqPosition);

2952

41425

ss = a.secondaryStructure;

2953

2954

// There is no representation for coil and it can be either ' ' or null.

2955

41428

if (ss == ' ' || ss == '-')

2956

{

2957

9747

ss = Constants.COIL;

}

}

else

{

28978

ss = Constants.COIL;

}

}

70406

return ss;

2967

}

2968

2969

1674

public static List<String> extractSSSourceInAlignmentAnnotation(

2970

AlignmentAnnotation[] annotations)

2971

{

2972

2973

1674

List<String> ssSources = new ArrayList<>();

2974

1674

Set<String> addedSources = new HashSet<>(); // to keep track of added

2975

// sources

2976

2977

1674

if (annotations == null)

{

return ssSources;

}

1662

for (AlignmentAnnotation aa : annotations)

2983

{

2984

2985

7817

String ssSource = extractSSSourceFromAnnotationDescription(aa);

2986

2987

7817

if (ssSource != null && !addedSources.contains(ssSource))

2988

{

2989

ssSources.add(ssSource);

2990

addedSources.add(ssSource);

}

}

1662

Collections.sort(ssSources);

2995

2996

1662

return ssSources;

}

61843

public static String extractSSSourceFromAnnotationDescription(

3001

AlignmentAnnotation aa)

3002

{

3003

3004

61843

for (String label : Constants.SECONDARY_STRUCTURE_LABELS.keySet())

3005

{

3006

3007

69036

if (label.equals(aa.label))

3008

{

3009

3010

54652

if (aa.getProperty(Constants.SS_PROVIDER_PROPERTY) != null)

3011

{

3012

3013

return aa.getProperty(Constants.SS_PROVIDER_PROPERTY);

}

// For JPred

54653

if (Constants.SS_ANNOTATION_FROM_JPRED_LABEL.equals(aa.label))

3019

{

3020

3021

return (Constants.SECONDARY_STRUCTURE_LABELS.get(aa.label));

}

// For input with secondary structure

3026

54653

if (Constants.SS_ANNOTATION_LABEL.equals(aa.label)

3027

&& aa.description != null

3028

&& Constants.SS_ANNOTATION_LABEL.equals(aa.description))

3029

{

3030

3031

17329

return (Constants.SECONDARY_STRUCTURE_LABELS.get(aa.label));

}

// For other sources

37324

if (aa.sequenceRef == null)

3037

{

3038

168

return null;

3039

}

3040

37156

else if (aa.sequenceRef.getDatasetSequence() == null)

{

return null;

}

37156

Vector<PDBEntry> pdbEntries = aa.sequenceRef.getDatasetSequence()

3045

.getAllPDBEntries();

3046

3047

// TODO: this is an incredibly fragile mechanism

3048

37156

for (PDBEntry entry : pdbEntries)

3049

{

3050

3051

45270

String entryProvider = entry.getProvider();

3052

45270

if (entryProvider == null)

3053

{

3054

// No provider - so this is either an old Jalview project, or not

3055

// retrieved from recognised source

3056

45270

entryProvider = "PDB";

3057

}

3058

3059

// Should (re)use a standard mechanism for extracting the PDB ID as it

3060

// is written 1QWXTUV:CHAIN

3061

// Trim the string from first occurrence of colon

3062

45270

String entryID = entry.getId();

3063

45270

int index = entryID.indexOf(':');

3064

3065

// Check if colon exists

3066

45270

if (index != -1)

3067

{

3068

3069

// Trim the string from first occurrence of colon

3070

entryID = entryID.substring(0, index);

}

// TODO: shouldn't need to extract from description what the

3075

// originating ID is for this annotation!

3076

45270

if (entryProvider == "PDB" && aa.description.toLowerCase()

3077

.contains("secondary structure for "

3078

+ entryID.toLowerCase()))

3079

{

3080

3081

37156

return entryProvider;

}

8114

else if (entryProvider != "PDB" && aa.description.toLowerCase()

3086

.contains(entryID.toLowerCase()))

3087

{

3088

3089

return entryProvider;

}

}

}

}

7192

return null;

}

// to do set priority for labels

3102

10826552

public static List<AlignmentAnnotation> getAlignmentAnnotationForSource(

3103

SequenceI seq, String ssSource)

3104

{

3105

3106

10827920

List<AlignmentAnnotation> ssAnnots = new ArrayList<AlignmentAnnotation>();

3107

10835360

for (String ssLabel : Constants.SECONDARY_STRUCTURE_LABELS.keySet())

3108

{

3109

3110

21475438

AlignmentAnnotation[] aa = seq.getAnnotation(ssLabel);

3111

21189853

if (aa != null)

3112

{

3113

3114

99300

if (Constants.SS_ALL_PROVIDERS.equals(ssSource))

3115

{

3116

49656

ssAnnots.addAll(Arrays.asList(aa));

3117

49656

continue;

3118

}

3119

3120

49644

for (AlignmentAnnotation annot : aa)

3121

{

3122

3123

54028

String ssSourceForAnnot = extractSSSourceFromAnnotationDescription(

3124

annot);

3125

54028

if (ssSourceForAnnot != null && ssSource.equals(ssSourceForAnnot))

3126

{

3127

54028

ssAnnots.add(annot);

}

}

}

}

10852554

if (ssAnnots.size() > 0)

3133

{

3134

99297

return ssAnnots;

3135

}

3136

3137

10742578

return null;

}

public static Map<SequenceI, ArrayList<AlignmentAnnotation>> getSequenceAssociatedAlignmentAnnotations(

3142

AlignmentAnnotation[] alignAnnotList, String selectedSSSource)

3143

{

3144

3145

Map<SequenceI, ArrayList<AlignmentAnnotation>> ssAlignmentAnnotationForSequences = new HashMap<SequenceI, ArrayList<AlignmentAnnotation>>();

3146

if (alignAnnotList == null || alignAnnotList.length == 0)

3147

{

3148

return ssAlignmentAnnotationForSequences;

3149

}

3150

3151

for (AlignmentAnnotation aa : alignAnnotList)

3152

{

3153

if (aa.sequenceRef == null)

{

continue;

}

if (isSecondaryStructureFrom(selectedSSSource, aa))

3159

{

3160

ssAlignmentAnnotationForSequences

3161

.computeIfAbsent(aa.sequenceRef.getDatasetSequence(),

3162

k -> new ArrayList<>())

.add(aa);

}

}

return ssAlignmentAnnotationForSequences;

}

/**

* @param selectedSSSource

3174

* @param aa

3175

* @return true if aa is from a provider or all providers as specified by

3176

* selectedSSSource

3177

3178

public static boolean isSecondaryStructureFrom(String selectedSSSource,

3179

AlignmentAnnotation aa)

3180

{

3181

3182

for (String label : Constants.SECONDARY_STRUCTURE_LABELS.keySet())

3183

{

3184

3185

if (label.equals(aa.label))

3186

{

3187

3188

if (selectedSSSource.equals(Constants.SS_ALL_PROVIDERS))

{

return true;

}

String ssSource = AlignmentUtils

3193

.extractSSSourceFromAnnotationDescription(aa);

3194

if (ssSource != null && ssSource.equals(selectedSSSource))

{

return true;

}

}

}

return false;

}

// Method to get the key for a given provider value

3204

public static String getSecondaryStructureProviderKey(

3205

String providerValue)

3206

{

3207

for (Map.Entry<String, String> entry : Constants.STRUCTURE_PROVIDERS

3208

.entrySet())

3209

{

3210

if (entry.getValue().equals(providerValue))

3211

{

3212

return entry.getKey(); // Return the key (abbreviation) for the matching

// provider value

}

}

return null; // Return null if no match is found

3217

}

3218

3219

public static String reduceLabelLength(String label)

3220

{

3221

// Split the input by " | "

3222

String[] parts = label.split(" \\| ");

3223

3224

// Map the full names to their abbreviations

3225

String reducedLabel = Arrays.stream(parts)

3226

.map(fullName -> Constants.STRUCTURE_PROVIDERS.entrySet()

3227

.stream()

3228

.filter(entry -> entry.getValue().equals(fullName))

3229

.map(Map.Entry::getKey).findFirst().orElse(fullName)) // Use

// fullName

// if

// no

// abbreviation

// is

// found

.collect(Collectors.joining(" | "));

3237

3238

return reducedLabel; // Return the reduced label if abbreviations were

// applied

}

public static Color getSecondaryStructureProviderColor(String label)

3243

{

3244

3245

// return Constants.STRUCTURE_PROVIDERS_COLOR.getOrDefault(label,

3246

// Color.BLACK);

3247

Color c = Constants.STRUCTURE_PROVIDERS_COLOR.get(label.trim());

if (c == null)

c = Color.BLACK;

return c;

}

public static void assignSecondaryStructureProviderColor(

3254

Map<String, Color> secondaryStructureProviderColorMap,

List<String> labels)

{

// Use a Set to track unique labels

3259

Set<String> uniqueLabels = new HashSet<>(labels);

3260

3261

Color[] palette = ColorBrewer.Paired

3262

.getColorPalette(uniqueLabels.size());

3263

3264

List<Color> colorList = new ArrayList<>();

3265

Collections.addAll(colorList, palette);

3266

Collections.shuffle(colorList);

3267

int i = 0;

3268

3269

// Loop through each unique label and add it to the map with a color.

3270

// for (String label : uniqueLabels)

3271

for (String label : labels)

3272

{

3273

// Generate or retrieve a color for the label.

3274

String name = label.toUpperCase(Locale.ROOT).trim();

3275

secondaryStructureProviderColorMap.put(name,

3276

// ColorUtils.getDefaultColourFromName(name));

3277

ColorUtils.getColourFromNameAndScheme(name, "DESATURATED"));

3278

// secondaryStructureProviderColorMap.put(label.toUpperCase().trim(),

3279

// colorList.get(i));

// i++;

}

}

}

Coverage Report

File AlignmentUtils.java

Coverage histogram

Code metrics

Classes

Class AlignmentUtils

Class AlignmentUtils.DnaVariant

Contributing tests

Contributing tests

Source view