File AlignmentUtils.java

Branches:

514

Statements:

1,034

Methods:

Classes:

LOC:

3,494

NCLOC:

2,188

Total complexity:

397

Complexity density:

0.38

Statements/Method:

15.21

Methods/Class:

Average method complexity:

5.84

Classes

Class	Line #	Total Statements	Complexity	TOTAL Coverage	Actions
AlignmentUtils	84	1,028	391	0.8383271 (83.8%)
AlignmentUtils.DnaVariant	100	6	6	0.0 (0%)

Class AlignmentUtils

Class AlignmentUtils	Line # 84	Total Statements 1,028	Complexity 391	TOTAL Coverage 0.8383271 (83.8%)
expandContext(AlignmentI,int) : AlignmentI expandContext(AlignmentI,int) : AlignmentI	141141	46.046	10.010	0.983871 0.98387198.4%
getSequenceIndex(AlignmentI,SequenceI) : int getSequenceIndex(AlignmentI,SequenceI) : int	247247	8.08	2.02	1.0 1.0100%
getSequencesByName(AlignmentI) : Map<String, List<SequenceI>> getSequencesByName(AlignmentI) : Map<String, List<SequenceI>>	270270	10.010	3.03	0.9285714 0.928571492.9%
mapProteinAlignmentToCdna(AlignmentI,AlignmentI) : boolean mapProteinAlignmentToCdna(AlignmentI,AlignmentI) : boolean	301301	7.07	3.03	0.7777778 0.777777877.8%
mapProteinToCdna(AlignmentI,AlignmentI,Set<SequenceI>,Set<SequenceI>,boolean) : boolean mapProteinToCdna(AlignmentI,AlignmentI,Set<SequenceI>,Set<SequenceI>,boolean) : boolean	343343	22.022	9.09	0.9375 0.937593.8%
mappingExists(List<AlignedCodonFrame>,SequenceI,SequenceI) : boolean mappingExists(List<AlignedCodonFrame>,SequenceI,SequenceI) : boolean	410410	5.05	3.03	0.6666667 0.666666766.7%
mapCdnaToProtein(SequenceI,SequenceI) : MapList mapCdnaToProtein(SequenceI,SequenceI) : MapList	443443	28.028	12.012	0.95238096 0.9523809695.2%
translatesAs(char[],int,char[]) : boolean translatesAs(char[],int,char[]) : boolean	533533	21.021	14.014	1.0 1.0100%
alignSequenceAs(SequenceI,AlignmentI,String,boolean,boolean) : boolean alignSequenceAs(SequenceI,AlignmentI,String,boolean,boolean) : boolean	610610	14.014	5.05	0.9 0.990%
alignSequenceAs(SequenceI,SequenceI,AlignedCodonFrame,String,char,boolean,boolean) : void alignSequenceAs(SequenceI,SequenceI,AlignedCodonFrame,String,char,boolean,boolean) : void	666666	60.060	20.020	1.0 1.0100%
calculateGapsToInsert(boolean,boolean,int,boolean,int,int,boolean) : int calculateGapsToInsert(boolean,boolean,int,boolean,int,int,boolean) : int	831831	15.015	10.010	1.0 1.0100%
alignProteinAsDna(AlignmentI,AlignmentI) : int alignProteinAsDna(AlignmentI,AlignmentI) : int	895895	6.06	3.03	0.625 0.62562.5%
alignCdsAsProtein(AlignmentI,AlignmentI) : int alignCdsAsProtein(AlignmentI,AlignmentI) : int	921921	18.018	5.05	0.8333333 0.833333383.3%
alignCdsSequenceAsProtein(SequenceI,AlignmentI,List<AlignedCodonFrame>,char) : boolean alignCdsSequenceAsProtein(SequenceI,AlignmentI,List<AlignedCodonFrame>,char) : boolean	967967	48.048	16.016	0.67105263 0.6710526367.1%
buildCodonColumnsMap(AlignmentI,AlignmentI,List<SequenceI>) : Map<AlignedCodon, Map<SequenceI, AlignedCodon>> buildCodonColumnsMap(AlignmentI,AlignmentI,List<SequenceI>) : Map<AlignedCodon, Map<SequenceI, AlignedCodon>>	10981098	13.013	2.02	1.0 1.0100%
addUnmappedPeptideStarts(Map<AlignedCodon, Map<SequenceI, AlignedCodon>>,int) : void addUnmappedPeptideStarts(Map<AlignedCodon, Map<SequenceI, AlignedCodon>>,int) : void	11541154	23.023	6.06	0.93939394 0.9393939493.9%
alignProteinAs(AlignmentI,Map<AlignedCodon, Map<SequenceI, AlignedCodon>>,List<SequenceI>) : int alignProteinAs(AlignmentI,Map<AlignedCodon, Map<SequenceI, AlignedCodon>>,List<SequenceI>) : int	12371237	17.017	2.02	1.0 1.0100%
addCodonPositions(SequenceI,SequenceI,char,Mapping,Map<AlignedCodon, Map<SequenceI, AlignedCodon>>) : void addCodonPositions(SequenceI,SequenceI,char,Mapping,Map<AlignedCodon, Map<SequenceI, AlignedCodon>>) : void	13021302	5.05	4.04	1.0 1.0100%
addCodonToMap(Map<AlignedCodon, Map<SequenceI, AlignedCodon>>,AlignedCodon,SequenceI) : void addCodonToMap(Map<AlignedCodon, Map<SequenceI, AlignedCodon>>,AlignedCodon,SequenceI) : void	13351335	5.05	2.02	1.0 1.0100%
isMappable(AlignmentI,AlignmentI) : boolean isMappable(AlignmentI,AlignmentI) : boolean	13651365	14.014	9.09	1.0 1.0100%
check3diPeptideMapping(AlignmentI,AlignmentI) : boolean check3diPeptideMapping(AlignmentI,AlignmentI) : boolean	13991399	14.014	6.06	1.0 1.0100%
canBuild3diMapping(SequenceI,SequenceI) : boolean canBuild3diMapping(SequenceI,SequenceI) : boolean	14351435	5.05	2.02	1.0 1.0100%
map3diPeptideToProteinAligment(AlignmentI,AlignmentI) : boolean map3diPeptideToProteinAligment(AlignmentI,AlignmentI) : boolean	14511451	6.06	3.03	0.75 0.7575%
mapProteinToTdiAlignment(AlignmentI,AlignmentI,Set<SequenceI>,Set<SequenceI>) : boolean mapProteinToTdiAlignment(AlignmentI,AlignmentI,Set<SequenceI>,Set<SequenceI>) : boolean	14861486	20.020	6.06	0.8333333 0.833333383.3%
isMappable(SequenceI,SequenceI,List<AlignedCodonFrame>) : boolean isMappable(SequenceI,SequenceI,List<AlignedCodonFrame>) : boolean	15401540	8.08	6.06	0.625 0.62562.5%
findAddableReferenceAnnotations(List<SequenceI>,Map<String, String>,Map<SequenceI, List<AlignmentAnnotation>>,AlignmentI) : void findAddableReferenceAnnotations(List<SequenceI>,Map<String, String>,Map<SequenceI, List<AlignmentAnnotation>>,AlignmentI) : void	15871587	26.026	10.010	0.90909094 0.9090909490.9%
addReferenceAnnotations(Map<SequenceI, List<AlignmentAnnotation>>,AlignmentI,SequenceGroup) : void addReferenceAnnotations(Map<SequenceI, List<AlignmentAnnotation>>,AlignmentI,SequenceGroup) : void	16721672	3.03	1.01	1.0 1.0100%
isSSAnnotationPresent(Map<SequenceI, List<AlignmentAnnotation>>) : boolean isSSAnnotationPresent(Map<SequenceI, List<AlignmentAnnotation>>) : boolean	16851685	4.04	2.02	1.0 1.0100%
addReferenceAnnotationTo(AlignmentI,SequenceI,AlignmentAnnotation,SequenceGroup) : AlignmentAnnotation addReferenceAnnotationTo(AlignmentI,SequenceI,AlignmentAnnotation,SequenceGroup) : AlignmentAnnotation	17141714	16.016	4.04	0.95454544 0.9545454495.5%
showOrHideSequenceAnnotations(AlignmentI,Collection<String>,List<SequenceI>,boolean,boolean) : void showOrHideSequenceAnnotations(AlignmentI,Collection<String>,List<SequenceI>,boolean,boolean) : void	17691769	6.06	7.07	0.9166667 0.916666791.7%
showOrHideAutoCalculatedAnnotationsForGroup(AlignmentI,String,SequenceGroup,boolean,boolean) : void showOrHideAutoCalculatedAnnotationsForGroup(AlignmentI,String,SequenceGroup,boolean,boolean) : void	18061806	6.06	7.07	0.0 0.00%
getFirstSequenceAnnotationOfType(AlignmentI,int) : AlignmentAnnotation getFirstSequenceAnnotationOfType(AlignmentI,int) : AlignmentAnnotation	18341834	6.06	4.04	0.0 0.00%
haveCrossRef(SequenceI,SequenceI) : boolean haveCrossRef(SequenceI,SequenceI) : boolean	18561856	1.01	1.01	1.0 1.0100%
hasCrossRef(SequenceI,SequenceI) : boolean hasCrossRef(SequenceI,SequenceI) : boolean	18711871	11.011	6.06	1.0 1.0100%
makeCdsAlignment(SequenceI[],AlignmentI,SequenceI[]) : AlignmentI makeCdsAlignment(SequenceI[],AlignmentI,SequenceI[]) : AlignmentI	19121912	66.066	16.016	0.8913044 0.891304489.1%
transferGeneLoci(SequenceI,MapList,SequenceI) : void transferGeneLoci(SequenceI,MapList,SequenceI) : void	21392139	8.08	4.04	0.9285714 0.928571492.9%
findCdsForProtein(List<AlignedCodonFrame>,SequenceI,List<AlignedCodonFrame>,Mapping) : SequenceI findCdsForProtein(List<AlignedCodonFrame>,SequenceI,List<AlignedCodonFrame>,Mapping) : SequenceI	21772177	19.019	11.011	0.9354839 0.935483993.5%
makeCdsSequence(SequenceI,Mapping,AlignmentI) : SequenceI makeCdsSequence(SequenceI,Mapping,AlignmentI) : SequenceI	22642264	32.032	10.010	0.62 0.6262%
propagateDBRefsToCDS(SequenceI,SequenceI,SequenceI,Mapping) : List<DBRefEntry> propagateDBRefsToCDS(SequenceI,SequenceI,SequenceI,Mapping) : List<DBRefEntry>	23572357	28.028	11.011	0.8863636 0.886363688.6%
transferFeatures(SequenceI,SequenceI,MapList,String,String) : int transferFeatures(SequenceI,SequenceI,MapList,String,String) : int	24452445	33.033	12.012	0.8867925 0.886792588.7%
mapCdsToProtein(SequenceI,SequenceI) : MapList mapCdsToProtein(SequenceI,SequenceI) : MapList	25412541	22.022	5.05	1.0 1.0100%
findCdsPositions(SequenceI) : List<int[]> findCdsPositions(SequenceI) : List<int[]>	26042604	20.020	7.07	0.9285714 0.928571492.9%
makeCopyAlignment(SequenceI[],SequenceI[],AlignmentI) : AlignmentI makeCopyAlignment(SequenceI[],SequenceI[],AlignmentI) : AlignmentI	26722672	21.021	9.09	0.0 0.00%
alignAs(AlignmentI,AlignmentI) : int alignAs(AlignmentI,AlignmentI) : int	27272727	26.026	5.05	0.88235295 0.8823529588.2%
alignAsSameSequences(AlignmentI,AlignmentI) : boolean alignAsSameSequences(AlignmentI,AlignmentI) : boolean	28062806	33.033	7.07	0.88372093 0.8837209388.4%
buildMappedColumnsMap(AlignmentI,AlignmentI,List<SequenceI>) : SortedMap<Integer, Map<SequenceI, Character>> buildMappedColumnsMap(AlignmentI,AlignmentI,List<SequenceI>) : SortedMap<Integer, Map<SequenceI, Character>>	29002900	11.011	3.03	0.93333334 0.9333333493.3%
addMappedPositions(SequenceI,SequenceI,Mapping,Map<Integer, Map<SequenceI, Character>>) : boolean addMappedPositions(SequenceI,SequenceI,Mapping,Map<Integer, Map<SequenceI, Character>>) : boolean	29542954	24.024	11.011	0.85 0.8585%
looksLikeEnsembl(AlignmentI) : boolean looksLikeEnsembl(AlignmentI) : boolean	30293029	5.05	3.03	0.71428573 0.7142857371.4%
deepCopyAlignment(AlignmentI) : AlignmentI deepCopyAlignment(AlignmentI) : AlignmentI	30463046	12.012	4.04	0.0 0.00%
getSecondaryStructureAnnots(AlignmentAnnotation[]) : List<AlignmentAnnotation> getSecondaryStructureAnnots(AlignmentAnnotation[]) : List<AlignmentAnnotation>	30713071	10.010	6.06	0.0 0.00%
isSecondaryStructurePresent(AlignmentAnnotation[]) : boolean isSecondaryStructurePresent(AlignmentAnnotation[]) : boolean	31003100	11.011	6.06	0.88235295 0.8823529588.2%
getSecondaryStructureAnnotationColour(char) : Color getSecondaryStructureAnnotationColour(char) : Color	31323132	7.07	4.04	1.0 1.0100%
findSSAnnotationForGivenSeqposition(AlignmentAnnotation,int) : char findSSAnnotationForGivenSeqposition(AlignmentAnnotation,int) : char	31513151	9.09	5.05	0.93333334 0.9333333493.3%
extractSSSourceInAlignmentAnnotation(AlignmentAnnotation[]) : List<String> extractSSSourceInAlignmentAnnotation(AlignmentAnnotation[]) : List<String>	31783178	11.011	4.04	1.0 1.0100%
getAlignmentAnnotationForSource(SequenceI,String) : List<AlignmentAnnotation> getAlignmentAnnotationForSource(SequenceI,String) : List<AlignmentAnnotation>	32163216	14.014	7.07	1.0 1.0100%
getSequenceAssociatedAlignmentAnnotations(AlignmentAnnotation[],String) : Map<SequenceI, ArrayList<AlignmentAnnotation>> getSequenceAssociatedAlignmentAnnotations(AlignmentAnnotation[],String) : Map<SequenceI, ArrayList<AlignmentAnnotation>>	32583258	9.09	5.05	0.8666667 0.866666786.7%
getSecondaryStructureAnnotionFor(List<AlignmentAnnotation>,String) : List<AlignmentAnnotation> getSecondaryStructureAnnotionFor(List<AlignmentAnnotation>,String) : List<AlignmentAnnotation>	32933293	5.05	2.02	0.0 0.00%
isSecondaryStructureFrom(String,AlignmentAnnotation) : boolean isSecondaryStructureFrom(String,AlignmentAnnotation) : boolean	33123312	8.08	5.05	1.0 1.0100%
getSecondaryStructureProviderKey(String) : String getSecondaryStructureProviderKey(String) : String	33383338	4.04	2.02	0.0 0.00%
reduceLabelLength(String) : String reduceLabelLength(String) : String	33533353	10.010	3.03	0.0 0.00%
assignColorsForSecondaryStructureProviders(List<String>) : HashMap<String, Color> assignColorsForSecondaryStructureProviders(List<String>) : HashMap<String, Color>	33733373	5.05	1.01	1.0 1.0100%
computeMaxShifts(SequenceI[],ShiftList) : int computeMaxShifts(SequenceI[],ShiftList) : int	33913391	22.022	8.08	1.0 1.0100%
a3mToMSA(SequenceI[]) : String a3mToMSA(SequenceI[]) : String	34433443	7.07	2.02	0.8888889 0.888888988.9%
insertShifts(SequenceI[],ShiftList) : int insertShifts(SequenceI[],ShiftList) : int	34573457	19.019	8.08	1.0 1.0100%

Class AlignmentUtils.DnaVariant

Class AlignmentUtils.DnaVariant	Line # 100	Total Statements 6	Complexity 6	TOTAL Coverage 0.0 (0%)
DnaVariant(String) DnaVariant(String)	106106	2.02	1.01	0.0 0.00%
DnaVariant(String,SequenceFeature) DnaVariant(String,SequenceFeature)	112112	2.02	1.01	0.0 0.00%
getSource() : String getSource() : String	118118	1.01	2.02	0.0 0.00%
toString() : String toString() : String	126126	1.01	2.02	0.0 0.00%

Contributing tests

This file is covered by 336 tests.

Contributing tests

Test contribution	Test	Result
0.2660891	jalview.io.CrossRef2xmlTests.openCrossrefsForEnsemblTwicejalview.io.CrossRef2xmlTests.openCrossrefsForEnsemblTwice	1PASS
0.11386139	jalview.analysis.AlignmentUtilsTests.testMakeCdsAlignmentjalview.analysis.AlignmentUtilsTests.testMakeCdsAlignment	1PASS
0.090965346	jalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_withXrefsjalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_withXrefs	1PASS
0.090965346	jalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_withStartAndStopCodonsjalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_withStartAndStopCodons	1PASS
0.089108914	jalview.datamodel.AlignmentTest.testAlignAs_tdi_protjalview.datamodel.AlignmentTest.testAlignAs_tdi_prot	1PASS
0.0884901	jalview.datamodel.AlignmentTest.testAlignAs_prot_tdijalview.datamodel.AlignmentTest.testAlignAs_prot_tdi	1PASS
0.083539605	jalview.analysis.AlignmentUtilsTests.testIsMappablejalview.analysis.AlignmentUtilsTests.testIsMappable	1PASS
0.08168317	jalview.analysis.AlignmentUtilsTests.testMakeCdsAlignment_multipleProteinsjalview.analysis.AlignmentUtilsTests.testMakeCdsAlignment_multipleProteins	1PASS
0.08106436	jalview.analysis.AlignmentUtilsTests.testMakeCdsAlignment_filterProductsjalview.analysis.AlignmentUtilsTests.testMakeCdsAlignment_filterProducts	1PASS
0.07920792	jalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_noXrefsjalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_noXrefs	1PASS
0.07735149	jalview.analysis.AlignmentUtilsTests.testMakeCdsAlignment_alternativeTranscriptsjalview.analysis.AlignmentUtilsTests.testMakeCdsAlignment_alternativeTranscripts	1PASS
0.07549505	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.074257426	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.074257426	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.0730198	jalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTestjalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTest	1PASS
0.0730198	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.0730198	jalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTestjalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTest	1PASS
0.0730198	jalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTestjalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTest	1PASS
0.0730198	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.07178218	jalview.bin.CommandsTest2.do_network_structureOpeningArgsTestjalview.bin.CommandsTest2.do_network_structureOpeningArgsTest	1PASS
0.07178218	jalview.bin.CommandsTest2.do_network_structureOpeningArgsTestjalview.bin.CommandsTest2.do_network_structureOpeningArgsTest	1PASS
0.07178218	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.07178218	jalview.bin.CommandsTest2.do_network_structureOpeningArgsTestjalview.bin.CommandsTest2.do_network_structureOpeningArgsTest	1PASS
0.07178218	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.07178218	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.07178218	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.07178218	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.070544556	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.070544556	jalview.io.FeaturesFileTest.simpleGff3FileLoaderjalview.io.FeaturesFileTest.simpleGff3FileLoader	1PASS
0.070544556	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.06745049	jalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_prioritiseXrefsjalview.analysis.AlignmentUtilsTests.testMapProteinAlignmentToCdna_prioritiseXrefs	1PASS
0.06621287	jalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withMapping_withIntronsjalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withMapping_withIntrons	1PASS
0.06559406	jalview.io.FeaturesFileTest.simpleGff3RelaxedIdMatchingjalview.io.FeaturesFileTest.simpleGff3RelaxedIdMatching	1PASS
0.06373762	jalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withMapping_noIntronsjalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withMapping_noIntrons	1PASS
0.060643565	jalview.project.Jalview2xmlTests.testSaveAndLoadAnnotationBasedTreejalview.project.Jalview2xmlTests.testSaveAndLoadAnnotationBasedTree	1PASS
0.060024753	jalview.io.FeaturesFileTest.simpleGff3FileClassjalview.io.FeaturesFileTest.simpleGff3FileClass	1PASS
0.05878713	jalview.analysis.AverageDistanceEngineTest.testUPGMAEnginejalview.analysis.AverageDistanceEngineTest.testUPGMAEngine	1PASS
0.05940594	jalview.project.Jalview2xmlTests.testSaveAndLoadAnnotationsPropertiesjalview.project.Jalview2xmlTests.testSaveAndLoadAnnotationsProperties	1PASS
0.060024753	jalview.io.FeaturesFileTest.readGff3Filejalview.io.FeaturesFileTest.readGff3File	1PASS
0.058168318	jalview.datamodel.AlignmentTest.testAlignAs_dnaAsDnajalview.datamodel.AlignmentTest.testAlignAs_dnaAsDna	1PASS
0.057549506	jalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_keepIntronGapsOnlyjalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_keepIntronGapsOnly	1PASS
0.056930695	jalview.analysis.AlignmentUtilsTests.testAlignAs_alternateTranscriptsUngappedjalview.analysis.AlignmentUtilsTests.testAlignAs_alternateTranscriptsUngapped	1PASS
0.054455444	jalview.analysis.AlignmentUtilsTests.testAlignProteinAsDna_incompleteStartCodonjalview.analysis.AlignmentUtilsTests.testAlignProteinAsDna_incompleteStartCodon	1PASS
0.055074256	jalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withMapping_withUnmappedProteinjalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withMapping_withUnmappedProtein	1PASS
0.053836633	jalview.gui.StructureChooserTest.openStructureFileForSequenceTestjalview.gui.StructureChooserTest.openStructureFileForSequenceTest	1PASS
0.053836633	jalview.gui.StructureChooserTest.openStructureFileForSequenceTestjalview.gui.StructureChooserTest.openStructureFileForSequenceTest	1PASS
0.053836633	jalview.gui.StructureChooserTest.openStructureFileForSequenceTestjalview.gui.StructureChooserTest.openStructureFileForSequenceTest	1PASS
0.053836633	jalview.gui.StructureChooserTest.openStructureFileForSequenceTestjalview.gui.StructureChooserTest.openStructureFileForSequenceTest	1PASS
0.05259901	jalview.gui.AnnotationLabelsTest2.testIdWidthNoChangesjalview.gui.AnnotationLabelsTest2.testIdWidthNoChanges	1PASS
0.05259901	jalview.gui.AnnotationLabelsTest2.testIdWidthNoChangesjalview.gui.AnnotationLabelsTest2.testIdWidthNoChanges	1PASS
0.05259901	jalview.gui.AnnotationLabelsTest2.testIdWidthChangesjalview.gui.AnnotationLabelsTest2.testIdWidthChanges	1PASS
0.05259901	jalview.gui.AnnotationLabelsTest2.testIdWidthChangesjalview.gui.AnnotationLabelsTest2.testIdWidthChanges	1PASS
0.051361386	jalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withTrailingPeptidejalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_withTrailingPeptide	1PASS
0.04950495	jalview.analysis.AlignmentUtilsTests.testAlignProteinAsDnajalview.analysis.AlignmentUtilsTests.testAlignProteinAsDna	1PASS
0.04888614	jalview.datamodel.AlignmentTest.testAlignAs_proteinAsCdnajalview.datamodel.AlignmentTest.testAlignAs_proteinAsCdna	1PASS
0.047029704	jalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_mappedProteinProteinjalview.analysis.AlignmentUtilsTests.testAlignSequenceAs_mappedProteinProtein	1PASS
0.047029704	jalview.ext.jmol.JmolViewerTest.testAddStrToSingleSeqViewJMoljalview.ext.jmol.JmolViewerTest.testAddStrToSingleSeqViewJMol	1PASS
0.04517327	jalview.datamodel.AlignmentTest.testAlignAs_cdnaAsProteinjalview.datamodel.AlignmentTest.testAlignAs_cdnaAsProtein	1PASS
0.043935645	jalview.datamodel.AlignmentTest.testAlignAs_cdnaAsProtein_singleSequencejalview.datamodel.AlignmentTest.testAlignAs_cdnaAsProtein_singleSequence	1PASS
0.044554457	jalview.analysis.AlignmentUtilsTests.testa3mToMSAjalview.analysis.AlignmentUtilsTests.testa3mToMSA	1PASS
0.04269802	jalview.analysis.AlignmentUtilsTests.testa3mToMSA_byfilejalview.analysis.AlignmentUtilsTests.testa3mToMSA_byfile	1PASS
0.04022277	jalview.project.Jalview2xmlTests.testRNAStructureRecoveryjalview.project.Jalview2xmlTests.testRNAStructureRecovery	1PASS
0.03960396	jalview.project.Jalview2xmlTests.testStoreAndRecoverPDBEntryjalview.project.Jalview2xmlTests.testStoreAndRecoverPDBEntry	1PASS
0.03960396	jalview.ext.jmol.JmolParserTest.testAlignmentLoaderjalview.ext.jmol.JmolParserTest.testAlignmentLoader	1PASS
0.03960396	jalview.ext.jmol.JmolViewerTest.testSingleSeqViewJMoljalview.ext.jmol.JmolViewerTest.testSingleSeqViewJMol	1PASS
0.03960396	jalview.io.AnnotatedPDBFileInputTest.testJalviewProjectRelocationAnnotationjalview.io.AnnotatedPDBFileInputTest.testJalviewProjectRelocationAnnotation	1PASS
0.035272278	jalview.analysis.AlignmentUtilsTests.testAddReferenceContactMapjalview.analysis.AlignmentUtilsTests.testAddReferenceContactMap	1PASS
0.03589109	jalview.analysis.AlignmentUtilsTests.testExpandContextjalview.analysis.AlignmentUtilsTests.testExpandContext	1PASS
0.034034654	jalview.project.Jalview2xmlTests.testPAEsaveRestorejalview.project.Jalview2xmlTests.testPAEsaveRestore	1PASS
0.034653466	jalview.analysis.AlignmentUtilsTests.testMapCdsToProteinjalview.analysis.AlignmentUtilsTests.testMapCdsToProtein	1PASS
0.034653466	jalview.ext.jmol.JmolParserTest.testFileParserjalview.ext.jmol.JmolParserTest.testFileParser	1PASS
0.031559408	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistancesjalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances	1PASS
0.03217822	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.03279703	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistancesjalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances	1PASS
0.03217822	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.03279703	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withGapjalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withGap	1PASS
0.03279703	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistancesjalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances	1PASS
0.031559408	jalview.analysis.AlignmentUtilsTests.testAddReferenceAnnotationsjalview.analysis.AlignmentUtilsTests.testAddReferenceAnnotations	1PASS
0.029084159	jalview.analysis.AlignmentUtilsTests.testExpandContext_annotationjalview.analysis.AlignmentUtilsTests.testExpandContext_annotation	1PASS
0.02970297	jalview.datamodel.AlignmentTest.testAlignAs_3dijalview.datamodel.AlignmentTest.testAlignAs_3di	1PASS
0.027846534	jalview.analysis.AAFrequencyTest.testExtractSSProfileForSequenceGroupjalview.analysis.AAFrequencyTest.testExtractSSProfileForSequenceGroup	1PASS
0.027227722	jalview.analysis.AlignmentUtilsTests.testMapCdnaToProtein_forSubsequencejalview.analysis.AlignmentUtilsTests.testMapCdnaToProtein_forSubsequence	1PASS
0.024133664	jalview.analysis.AlignmentUtilsTests.testTransferFeaturesjalview.analysis.AlignmentUtilsTests.testTransferFeatures	1PASS
0.02289604	jalview.gui.AlignFrameTest.testNewView_colourThresholdsjalview.gui.AlignFrameTest.testNewView_colourThresholds	1PASS
0.02289604	jalview.project.Jalview2xmlTests.testTCoffeeScoresjalview.project.Jalview2xmlTests.testTCoffeeScores	1PASS
0.02289604	jalview.project.Jalview2xmlTests.testColourByAnnotScoresjalview.project.Jalview2xmlTests.testColourByAnnotScores	1PASS
0.023514852	jalview.analysis.AlignmentUtilsTests.testAlignAsSameSequencesjalview.analysis.AlignmentUtilsTests.testAlignAsSameSequences	1PASS
0.021658415	jalview.gui.AlignViewportTest.testGetSelectionAsNewSequences_withContactMatricesjalview.gui.AlignViewportTest.testGetSelectionAsNewSequences_withContactMatrices	1PASS
0.021658415	jalview.project.Jalview2xmlTests.testStoreAndRecoverAnnotationRowElementColoursjalview.project.Jalview2xmlTests.testStoreAndRecoverAnnotationRowElementColours	1PASS
0.022277229	jalview.analysis.AlignmentUtilsTests.testTransferFeatures_withOmitjalview.analysis.AlignmentUtilsTests.testTransferFeatures_withOmit	1PASS
0.02289604	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.023514852	jalview.analysis.AlignmentUtilsTests.testTranslatesAsjalview.analysis.AlignmentUtilsTests.testTranslatesAs	1PASS
0.02289604	jalview.analysis.AlignmentUtilsTests.testAlignAsSameSequencesMultipleSubSeqjalview.analysis.AlignmentUtilsTests.testAlignAsSameSequencesMultipleSubSeq	1PASS
0.02289604	jalview.project.Jalview2xmlTests.testStoreAndRecoverColourThresholdsjalview.project.Jalview2xmlTests.testStoreAndRecoverColourThresholds	1PASS
0.02289604	jalview.io.AnnotationFileIOTest.testProviderRestorejalview.io.AnnotationFileIOTest.testProviderRestore	1PASS
0.021658415	jalview.project.Jalview2xmlTests.testStoreAndRecoverHmmProfilejalview.project.Jalview2xmlTests.testStoreAndRecoverHmmProfile	1PASS
0.021658415	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withSSUndefinedInBothSeqsjalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withSSUndefinedInBothSeqs	1PASS
0.021658415	jalview.gui.ColourMenuHelperTest.testAddMenuItems_nucleotidejalview.gui.ColourMenuHelperTest.testAddMenuItems_nucleotide	1PASS
0.01980198	jalview.analysis.AlignmentUtilsTests.testAddMappedPositionsjalview.analysis.AlignmentUtilsTests.testAddMappedPositions	1PASS
0.018564356	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withSSUndefinedInEitherOneSeqjalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances_withSSUndefinedInEitherOneSeq	1PASS
0.019183168	jalview.gui.AnnotationChooserTest.testBuildApplyToOptionsPanel_noSelectionGroupjalview.gui.AnnotationChooserTest.testBuildApplyToOptionsPanel_noSelectionGroup	1PASS
0.01980198	jalview.analysis.AlignmentUtilsTests.testAddMappedPositions_withStopCodonjalview.analysis.AlignmentUtilsTests.testAddMappedPositions_withStopCodon	1PASS
0.019183168	jalview.gui.AppVarnaTest.testReplaceOddGapsjalview.gui.AppVarnaTest.testReplaceOddGaps	1PASS
0.019183168	jalview.gui.PopupMenuTest.testHideInsertionsjalview.gui.PopupMenuTest.testHideInsertions	1PASS
0.017945545	jalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_alreadyAddedjalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_alreadyAdded	1PASS
0.018564356	jalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenujalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu	1PASS
0.019183168	jalview.gui.AnnotationChooserTest.testSelectType_showForSelectedjalview.gui.AnnotationChooserTest.testSelectType_showForSelected	1PASS
0.019183168	jalview.gui.AlignFrameTest.testChangeColour_background_groupsAndThresholdsjalview.gui.AlignFrameTest.testChangeColour_background_groupsAndThresholds	1PASS
0.019183168	jalview.gui.AnnotationChooserTest.testResetOriginalStatejalview.gui.AnnotationChooserTest.testResetOriginalState	1PASS
0.01980198	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.018564356	jalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_notOnAlignmentjalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_notOnAlignment	1PASS
0.019183168	jalview.gui.AnnotationChooserTest.testDeselectType_hideForSelectedjalview.gui.AnnotationChooserTest.testDeselectType_hideForSelected	1PASS
0.017945545	jalview.analysis.AlignmentUtilsTests.testFindCdsForProtein_noUTRjalview.analysis.AlignmentUtilsTests.testFindCdsForProtein_noUTR	1PASS
0.018564356	jalview.analysis.AlignmentUtilsTests.testTransferFeatures_withSelectjalview.analysis.AlignmentUtilsTests.testTransferFeatures_withSelect	1PASS
0.019183168	jalview.gui.AnnotationChooserTest.testIsInActionScope_unselectedScopejalview.gui.AnnotationChooserTest.testIsInActionScope_unselectedScope	1PASS
0.019183168	jalview.gui.AnnotationChooserTest.testSelectType_hideForAlljalview.gui.AnnotationChooserTest.testSelectType_hideForAll	1PASS
0.01608911	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.01608911	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01608911	jalview.gui.QuitHandlerTest.testUnsavedChangesjalview.gui.QuitHandlerTest.testUnsavedChanges	1PASS
0.01608911	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.01608911	jalview.project.Jalview2xmlTests.viewRefPdbAnnotationjalview.project.Jalview2xmlTests.viewRefPdbAnnotation	1PASS
0.01608911	jalview.io.FeaturesFileTest.testParsejalview.io.FeaturesFileTest.testParse	1PASS
0.01608911	jalview.gui.ScalePanelTest.testPreventNegativeStartColumnjalview.gui.ScalePanelTest.testPreventNegativeStartColumn	1PASS
0.01608911	jalview.gui.QuitHandlerTest.testWaitForSaveQuitjalview.gui.QuitHandlerTest.testWaitForSaveQuit	1PASS
0.01608911	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.01608911	jalview.gui.ScalePanelTest.testBuildPopupMenujalview.gui.ScalePanelTest.testBuildPopupMenu	1PASS
0.01608911	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01608911	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel_HiddenColumnsjalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel_HiddenColumns	1PASS
0.01608911	jalview.gui.QuitHandlerTest.testForceQuitjalview.gui.QuitHandlerTest.testForceQuit	1PASS
0.01608911	jalview.gui.QuitHandlerTest.testNoGUIUnsavedChangesjalview.gui.QuitHandlerTest.testNoGUIUnsavedChanges	1PASS
0.01608911	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01608911	jalview.io.AnnotationExporterTest.testAnnotationExportAsCSVjalview.io.AnnotationExporterTest.testAnnotationExportAsCSV	1PASS
0.01608911	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.01608911	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01608911	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.01608911	jalview.gui.StructureChooserTest.openStructureFileForSequenceTestjalview.gui.StructureChooserTest.openStructureFileForSequenceTest	1PASS
0.01608911	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.01608911	jalview.gui.ColourMenuHelperTest.testAddMenuItems_forAlignFramejalview.gui.ColourMenuHelperTest.testAddMenuItems_forAlignFrame	1PASS
0.01608911	jalview.renderer.seqfeatures.FeatureRendererTest.testFindAllFeaturesjalview.renderer.seqfeatures.FeatureRendererTest.testFindAllFeatures	1PASS
0.01608911	jalview.renderer.seqfeatures.FeatureRendererTest.testFindComplementFeaturesAtResiduejalview.renderer.seqfeatures.FeatureRendererTest.testFindComplementFeaturesAtResidue	1PASS
0.01608911	jalview.project.Jalview2xmlTests.testStoreAndRecoverNoOverviewjalview.project.Jalview2xmlTests.testStoreAndRecoverNoOverview	1PASS
0.01608911	jalview.io.FeaturesFileTest.testPrintGffFormatjalview.io.FeaturesFileTest.testPrintGffFormat	1PASS
0.01608911	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.01608911	jalview.gui.AlignFrameTest.testHideFeatureColumnsjalview.gui.AlignFrameTest.testHideFeatureColumns	1PASS
0.01608911	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01608911	jalview.project.Jalview2xmlTests.testStoreAndRecoverReferenceSeqSettingsjalview.project.Jalview2xmlTests.testStoreAndRecoverReferenceSeqSettings	1PASS
0.01608911	jalview.controller.AlignViewControllerTest.testSelectColumnsWithHighlightjalview.controller.AlignViewControllerTest.testSelectColumnsWithHighlight	1PASS
0.01608911	jalview.gui.PairwiseAlignmentPanelTest.testConstructor_noSelectionGroupjalview.gui.PairwiseAlignmentPanelTest.testConstructor_noSelectionGroup	1PASS
0.01608911	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01608911	jalview.ext.jmol.JmolCommandsTest.testGetColourBySequenceCommands_hiddenColumnsjalview.ext.jmol.JmolCommandsTest.testGetColourBySequenceCommands_hiddenColumns	1PASS
0.01608911	jalview.schemes.ClustalxColourSchemeTest.testFindColourjalview.schemes.ClustalxColourSchemeTest.testFindColour	1PASS
0.01608911	jalview.io.FeaturesFileTest.testPrintJalviewFormatjalview.io.FeaturesFileTest.testPrintJalviewFormat	1PASS
0.01608911	jalview.renderer.seqfeatures.FeatureRendererTest.testFindFeaturesAtColumnjalview.renderer.seqfeatures.FeatureRendererTest.testFindFeaturesAtColumn	1PASS
0.01608911	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.01608911	jalview.structures.models.AAStructureBindingModelTest.testBuildColoursMapjalview.structures.models.AAStructureBindingModelTest.testBuildColoursMap	1PASS
0.01608911	jalview.gui.QuitHandlerTest.testSavedAlignmentChangesjalview.gui.QuitHandlerTest.testSavedAlignmentChanges	1PASS
0.01608911	jalview.project.Jalview2xmlTests.testMergeDatasetsforManyViewsjalview.project.Jalview2xmlTests.testMergeDatasetsforManyViews	1PASS
0.01608911	jalview.gui.FeatureSettingsTest.testSaveLoadjalview.gui.FeatureSettingsTest.testSaveLoad	1PASS
0.01608911	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01608911	jalview.io.gff.GffTests.testResolveExonerateGffjalview.io.gff.GffTests.testResolveExonerateGff	1PASS
0.01608911	jalview.project.Jalview2xmlTests.testCopyViewSettingsjalview.project.Jalview2xmlTests.testCopyViewSettings	1PASS
0.01608911	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFindDistances_withParamsjalview.analysis.scoremodels.FeatureDistanceModelTest.testFindDistances_withParams	1PASS
0.01608911	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01608911	jalview.gui.SeqPanelTest.testSetStatusReturnsNearestResiduePositionjalview.gui.SeqPanelTest.testSetStatusReturnsNearestResiduePosition	1PASS
0.01608911	jalview.project.Jalview2xmlTests.testSaveLoadFeatureColoursAndFiltersjalview.project.Jalview2xmlTests.testSaveLoadFeatureColoursAndFilters	1PASS
0.01608911	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.01608911	jalview.io.FeaturesFileTest.testParse_pureGff3jalview.io.FeaturesFileTest.testParse_pureGff3	1PASS
0.01608911	jalview.renderer.seqfeatures.FeatureRendererTest.testGetColourjalview.renderer.seqfeatures.FeatureRendererTest.testGetColour	1PASS
0.01608911	jalview.project.Jalview2xmlTests.testStoreAndRecoverExpandedviewsjalview.project.Jalview2xmlTests.testStoreAndRecoverExpandedviews	1PASS
0.01608911	jalview.project.Jalview2xmlTests.testPcaViewAssociationjalview.project.Jalview2xmlTests.testPcaViewAssociation	1PASS
0.01608911	jalview.gui.AlignViewportTest.testDeregisterMapping_withNoReferencejalview.gui.AlignViewportTest.testDeregisterMapping_withNoReference	1PASS
0.01608911	jalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTestjalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTest	1PASS
0.01608911	jalview.gui.AlignmentPanelTest.testSetOverviewTitle_automaticOverviewjalview.gui.AlignmentPanelTest.testSetOverviewTitle_automaticOverview	1PASS
0.01608911	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.01608911	jalview.project.Jalview2xmlTests.testStoreAndRecoverGroupRepSeqsjalview.project.Jalview2xmlTests.testStoreAndRecoverGroupRepSeqs	1PASS
0.01608911	jalview.gui.AlignViewportTest.testShowOrDontShowOccupancyjalview.gui.AlignViewportTest.testShowOrDontShowOccupancy	3FAIL
0.01608911	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01608911	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.01608911	jalview.gui.AlignViewportTest.testSetSelectionGroupjalview.gui.AlignViewportTest.testSetSelectionGroup	1PASS
0.01608911	jalview.analysis.AlignmentUtilsTests.testA3mInsertShiftsjalview.analysis.AlignmentUtilsTests.testA3mInsertShifts	1PASS
0.01608911	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.01608911	jalview.io.JSONFileTest.testBioJSONRoundTripWithColourSchemeNonejalview.io.JSONFileTest.testBioJSONRoundTripWithColourSchemeNone	1PASS
0.01608911	jalview.project.Jalview2xmlTests.testStoreAndRecoverOverviewjalview.project.Jalview2xmlTests.testStoreAndRecoverOverview	1PASS
0.01608911	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.015470297	jalview.analysis.AlignmentUtilsTests.testFindCdsPositions_fivePrimeIncompletejalview.analysis.AlignmentUtilsTests.testFindCdsPositions_fivePrimeIncomplete	1PASS
0.01608911	jalview.gui.QuitHandlerTest.testSavedProjectChangesjalview.gui.QuitHandlerTest.testSavedProjectChanges	1PASS
0.01608911	jalview.project.Jalview2xmlTests.gatherViewsHerejalview.project.Jalview2xmlTests.gatherViewsHere	1PASS
0.01608911	jalview.gui.DesktopTests.testInternalCopyPastejalview.gui.DesktopTests.testInternalCopyPaste	1PASS
0.01608911	jalview.io.AnnotationFileIOTest.testCalcIdRestorejalview.io.AnnotationFileIOTest.testCalcIdRestore	1PASS
0.01608911	jalview.renderer.ScaleRendererTest.testCalculateMarksjalview.renderer.ScaleRendererTest.testCalculateMarks	1PASS
0.01608911	jalview.schemes.ColourSchemesTest.testGetColourSchemejalview.schemes.ColourSchemesTest.testGetColourScheme	1PASS
0.01608911	jalview.io.JSONFileTest.testGrpParsed_colourNonejalview.io.JSONFileTest.testGrpParsed_colourNone	1PASS
0.01608911	jalview.controller.AlignViewControllerTest.testFindColumnsWithFeaturejalview.controller.AlignViewControllerTest.testFindColumnsWithFeature	1PASS
0.01608911	jalview.gui.AlignViewportTest.testGetConsensusSeqjalview.gui.AlignViewportTest.testGetConsensusSeq	1PASS
0.01608911	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01608911	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.01608911	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModeljalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel	1PASS
0.01608911	jalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistancesjalview.analysis.scoremodels.SecondaryStructureDistanceModelTest.testFindDistances	1PASS
0.01608911	jalview.bin.CommandsTest.allLinkedIdsTestjalview.bin.CommandsTest.allLinkedIdsTest	1PASS
0.01608911	jalview.gui.ScalePanelTest.testSelectColumns_withHiddenjalview.gui.ScalePanelTest.testSelectColumns_withHidden	1PASS
0.01608911	jalview.project.Jalview2xmlTests.testAutoShowOverviewForLegacyProjectsjalview.project.Jalview2xmlTests.testAutoShowOverviewForLegacyProjects	1PASS
0.01608911	jalview.project.Jalview2xmlTests.testStoreAndRecoverGeneLocusjalview.project.Jalview2xmlTests.testStoreAndRecoverGeneLocus	1PASS
0.01608911	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFindDistancesjalview.analysis.scoremodels.FeatureDistanceModelTest.testFindDistances	1PASS
0.01608911	jalview.project.Jalview2xmlTests.testStoreAndRestoreIDwidthAndAnnotationHeightjalview.project.Jalview2xmlTests.testStoreAndRestoreIDwidthAndAnnotationHeight	1PASS
0.01608911	jalview.project.Jalview2xmlTests.testMergeDatasetsforViewsjalview.project.Jalview2xmlTests.testMergeDatasetsforViews	1PASS
0.01608911	jalview.project.Jalview2xmlTests.noDuplicatePdbMappingsMadejalview.project.Jalview2xmlTests.noDuplicatePdbMappingsMade	1PASS
0.01608911	jalview.schemes.PIDColourSchemeTest.testFindColour_ignoreGapsjalview.schemes.PIDColourSchemeTest.testFindColour_ignoreGaps	1PASS
0.014851485	jalview.io.vcf.VCFLoaderTest.testDoLoad_vepCsqjalview.io.vcf.VCFLoaderTest.testDoLoad_vepCsq	1PASS
0.015470297	jalview.analysis.AlignmentUtilsTests.testFindCdsForProteinjalview.analysis.AlignmentUtilsTests.testFindCdsForProtein	1PASS
0.01608911	jalview.gui.StructureChooserTest.openStructureFileForSequenceTestjalview.gui.StructureChooserTest.openStructureFileForSequenceTest	1PASS
0.01608911	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel_hiddenFirstColumnjalview.analysis.scoremodels.FeatureDistanceModelTest.testFeatureScoreModel_hiddenFirstColumn	1PASS
0.01608911	jalview.gui.SeqPanelTest.testAmbiguousAminoAcidGetsStatusMessagejalview.gui.SeqPanelTest.testAmbiguousAminoAcidGetsStatusMessage	1PASS
0.01608911	jalview.io.AnnotationFileIOTest.testAnnotateAlignmentViewjalview.io.AnnotationFileIOTest.testAnnotateAlignmentView	1PASS
0.01608911	jalview.gui.AlignViewportTest.testDeregisterMapping_withReferencejalview.gui.AlignViewportTest.testDeregisterMapping_withReference	1PASS
0.01608911	jalview.io.FeaturesFileTest.testPrintJalviewFormat_withFiltersjalview.io.FeaturesFileTest.testPrintJalviewFormat_withFilters	1PASS
0.01608911	jalview.gui.AlignViewportTest.testUpdateConservation_qualityOnlyjalview.gui.AlignViewportTest.testUpdateConservation_qualityOnly	1PASS
0.01608911	jalview.renderer.seqfeatures.FeatureRendererTest.testFilterFeaturesForDisplayjalview.renderer.seqfeatures.FeatureRendererTest.testFilterFeaturesForDisplay	1PASS
0.01608911	jalview.bin.CommandsTest2.do_structureOpeningArgsTestjalview.bin.CommandsTest2.do_structureOpeningArgsTest	1PASS
0.01608911	jalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTestjalview.bin.CommandsTest.argFilesGlobAndSubstitutionsTest	1PASS
0.01608911	jalview.datamodel.AlignmentViewTest.testGetVisibleContigsjalview.datamodel.AlignmentViewTest.testGetVisibleContigs	1PASS
0.01608911	jalview.bin.CommandsTest.commandsOpenTestjalview.bin.CommandsTest.commandsOpenTest	1PASS
0.014851485	jalview.io.vcf.VCFLoaderTest.testDoLoadjalview.io.vcf.VCFLoaderTest.testDoLoad	1PASS
0.014851485	jalview.gui.AlignViewportTest.testDeregisterMapping_onCloseViewjalview.gui.AlignViewportTest.testDeregisterMapping_onCloseView	1PASS
0.014851485	jalview.io.BackupFilesTest.backupsEnabledNoRollMaxTestjalview.io.BackupFilesTest.backupsEnabledNoRollMaxTest	1PASS
0.014851485	jalview.io.BackupFilesTest.backupsEnabledSingleFileBackupTestjalview.io.BackupFilesTest.backupsEnabledSingleFileBackupTest	1PASS
0.014851485	jalview.io.BackupFilesTest.noBackupsEnabledTestjalview.io.BackupFilesTest.noBackupsEnabledTest	1PASS
0.014851485	jalview.gui.SeqPanelTest.testFindMousePosition_wrapped_scales_longSequencejalview.gui.SeqPanelTest.testFindMousePosition_wrapped_scales_longSequence	1PASS
0.014851485	jalview.io.BackupFilesTest.backupsEnabledReverseRollMaxTestjalview.io.BackupFilesTest.backupsEnabledReverseRollMaxTest	1PASS
0.014851485	jalview.io.BackupFilesTest.backupsEnabledRollMaxTestjalview.io.BackupFilesTest.backupsEnabledRollMaxTest	1PASS
0.014851485	jalview.analysis.scoremodels.FeatureDistanceModelTest.testFindFeatureAt_PointFeaturejalview.analysis.scoremodels.FeatureDistanceModelTest.testFindFeatureAt_PointFeature	1PASS
0.014851485	jalview.io.vcf.VCFLoaderTest.testDoLoad_reverseStrandjalview.io.vcf.VCFLoaderTest.testDoLoad_reverseStrand	1PASS
0.014851485	jalview.schemes.ClustalxColourSchemeTest.testFindColour_ignoreGapsjalview.schemes.ClustalxColourSchemeTest.testFindColour_ignoreGaps	1PASS
0.013613861	jalview.gui.AnnotationChooserTest.testIsInActionScope_selectedScopejalview.gui.AnnotationChooserTest.testIsInActionScope_selectedScope	1PASS
0.013613861	jalview.io.AnnotationFileIOTest.exampleAnnotationFileIOjalview.io.AnnotationFileIOTest.exampleAnnotationFileIO	1PASS
0.013613861	jalview.gui.AnnotationChooserTest.testSelectType_hideForSelectedjalview.gui.AnnotationChooserTest.testSelectType_hideForSelected	1PASS
0.013613861	jalview.gui.AnnotationChooserTest.testDeselectType_showForSelectedjalview.gui.AnnotationChooserTest.testDeselectType_showForSelected	1PASS
0.012376238	jalview.schemes.ResidueColourSchemeTest.testIsApplicableTo_dynamicColourSchemejalview.schemes.ResidueColourSchemeTest.testIsApplicableTo_dynamicColourScheme	1PASS
0.012376238	jalview.workers.AlignCaclManager2Test.testIsWorkingWithAnnotationjalview.workers.AlignCaclManager2Test.testIsWorkingWithAnnotation	1PASS
0.012995049	jalview.analysis.AlignmentUtilsTests.testGetAlignmentAnnotationForSourcejalview.analysis.AlignmentUtilsTests.testGetAlignmentAnnotationForSource	1PASS
0.013613861	jalview.gui.AnnotationChooserTest.testDeselectType_hideForAlljalview.gui.AnnotationChooserTest.testDeselectType_hideForAll	1PASS
0.013613861	jalview.gui.AnnotationChooserTest.testDeselectType_showForAlljalview.gui.AnnotationChooserTest.testDeselectType_showForAll	1PASS
0.013613861	jalview.gui.AnnotationChooserTest.testSelectType_showForAlljalview.gui.AnnotationChooserTest.testSelectType_showForAll	1PASS
0.012376238	jalview.schemes.AnnotationColourGradientTest.testFindColour_aboveThresholdjalview.schemes.AnnotationColourGradientTest.testFindColour_aboveThreshold	1PASS
0.012376238	jalview.workers.AlignCaclManager2Test.testRestartCompletedWorkersjalview.workers.AlignCaclManager2Test.testRestartCompletedWorkers	1PASS
0.011757426	jalview.analysis.AlignmentUtilsTests.testFindCdsPositionsjalview.analysis.AlignmentUtilsTests.testFindCdsPositions	1PASS
0.012376238	jalview.workers.AlignCaclManager2Test.testRestartCancelsWorkersjalview.workers.AlignCaclManager2Test.testRestartCancelsWorkers	1PASS
0.012376238	jalview.workers.AlignCaclManager2Test.testStartOneShotWorkerjalview.workers.AlignCaclManager2Test.testStartOneShotWorker	1PASS
0.012376238	jalview.analysis.AlignmentUtilsTests.testHasCrossRefjalview.analysis.AlignmentUtilsTests.testHasCrossRef	1PASS
0.012376238	jalview.analysis.AlignmentUtilsTests.testHaveCrossRefjalview.analysis.AlignmentUtilsTests.testHaveCrossRef	1PASS
0.012376238	jalview.workers.AlignCaclManager2Test.restartOneShotWorkerjalview.workers.AlignCaclManager2Test.restartOneShotWorker	1PASS
0.012376238	jalview.workers.AlignCaclManager2Test.testRestartDisabledWorkerjalview.workers.AlignCaclManager2Test.testRestartDisabledWorker	3FAIL
0.012376238	jalview.io.cache.JvCacheableInputBoxTest.updateCacheTestjalview.io.cache.JvCacheableInputBoxTest.updateCacheTest	1PASS
0.010519802	jalview.gui.SeqPanelTest.testFindColumn_unwrappedjalview.gui.SeqPanelTest.testFindColumn_unwrapped	1PASS
0.010519802	jalview.io.JalviewExportPropertiesTests.testImportExportPeriodGapsjalview.io.JalviewExportPropertiesTests.testImportExportPeriodGaps	1PASS
0.010519802	jalview.analysis.DnaTest.testTranslateCdna_withUntranslatableCodonsAndHiddenColumnsjalview.analysis.DnaTest.testTranslateCdna_withUntranslatableCodonsAndHiddenColumns	1PASS
0.010519802	jalview.util.MappingUtilsTest.testMapSequenceGroup_sharedDatasetjalview.util.MappingUtilsTest.testMapSequenceGroup_sharedDataset	1PASS
0.010519802	jalview.gui.PairwiseAlignmentPanelTest.testConstructor_withSelectionGroupjalview.gui.PairwiseAlignmentPanelTest.testConstructor_withSelectionGroup	1PASS
0.010519802	jalview.io.gff.ExonerateHelperTest.testAddExonerateGffToAlignmentjalview.io.gff.ExonerateHelperTest.testAddExonerateGffToAlignment	1PASS
0.010519802	jalview.renderer.seqfeatures.FeatureRendererTest.testIsVisiblejalview.renderer.seqfeatures.FeatureRendererTest.testIsVisible	1PASS
0.010519802	jalview.gui.AlignViewportTest.testSetGetHasSearchResultsjalview.gui.AlignViewportTest.testSetGetHasSearchResults	1PASS
0.010519802	jalview.gui.SeqPanelTest.testFindMousePosition_wrapped_annotationsjalview.gui.SeqPanelTest.testFindMousePosition_wrapped_annotations	1PASS
0.010519802	jalview.io.FeaturesFileTest.testParse_mixedJalviewGffjalview.io.FeaturesFileTest.testParse_mixedJalviewGff	1PASS
0.010519802	jalview.renderer.OverviewResColourFinderTest.testGetResidueBoxColour_zappojalview.renderer.OverviewResColourFinderTest.testGetResidueBoxColour_zappo	1PASS
0.010519802	jalview.ws2.actions.alignment.AlignmentActionTest.submitSequences_submitGapsOff_verifySequencesSubmittedWithoutGapsjalview.ws2.actions.alignment.AlignmentActionTest.submitSequences_submitGapsOff_verifySequencesSubmittedWithoutGaps	1PASS
0.010519802	jalview.ws2.actions.alignment.AlignmentActionListenerNotifiedTest.submitSequences_submitGapsOff_verifySequencesSubmittedWithoutGapsjalview.ws2.actions.alignment.AlignmentActionListenerNotifiedTest.submitSequences_submitGapsOff_verifySequencesSubmittedWithoutGaps	1PASS
0.010519802	jalview.schemes.ColourSchemesTest.testRegisterColourSchemejalview.schemes.ColourSchemesTest.testRegisterColourScheme	1PASS
0.010519802	jalview.ws2.actions.alignment.AlignmentActionTest.retrieveResult_verifySequencesAlignedjalview.ws2.actions.alignment.AlignmentActionTest.retrieveResult_verifySequencesAligned	1PASS
0.010519802	jalview.ws2.actions.alignment.AlignmentActionListenerNotifiedTest.submitSequences_submitGapsOn_verifySequencesSubmittedWithGapsjalview.ws2.actions.alignment.AlignmentActionListenerNotifiedTest.submitSequences_submitGapsOn_verifySequencesSubmittedWithGaps	1PASS
0.010519802	jalview.datamodel.HiddenSequencesTest.testHideShowSequence_withHiddenRepSequencejalview.datamodel.HiddenSequencesTest.testHideShowSequence_withHiddenRepSequence	1PASS
0.010519802	jalview.gui.AlignmentPanelTest.testSetOverviewTitlejalview.gui.AlignmentPanelTest.testSetOverviewTitle	1PASS
0.010519802	jalview.ws2.actions.alignment.AlignmentActionListenerNotifiedTest.retrieveResult_verifySequencesAlignedjalview.ws2.actions.alignment.AlignmentActionListenerNotifiedTest.retrieveResult_verifySequencesAligned	1PASS
0.010519802	jalview.gui.AlignViewportTest.testSetGlobalColourSchemejalview.gui.AlignViewportTest.testSetGlobalColourScheme	1PASS
0.010519802	jalview.util.MappingUtilsTest.testMapColumnSelection_nulljalview.util.MappingUtilsTest.testMapColumnSelection_null	1PASS
0.010519802	jalview.util.MappingUtilsTest.testMapSequenceGroup_columnsjalview.util.MappingUtilsTest.testMapSequenceGroup_columns	1PASS
0.010519802	jalview.renderer.OverviewResColourFinderTest.testGetResidueBoxColour_nonejalview.renderer.OverviewResColourFinderTest.testGetResidueBoxColour_none	1PASS
0.011138614	jalview.analysis.AlignmentUtilsTests.testIsSSAnnotationPresentjalview.analysis.AlignmentUtilsTests.testIsSSAnnotationPresent	1PASS
0.010519802	jalview.renderer.ResidueColourFinderTest.testGetResidueColour_zappojalview.renderer.ResidueColourFinderTest.testGetResidueColour_zappo	1PASS
0.010519802	jalview.renderer.OverviewResColourFinderTest.testGetResidueBoxColour_userdefjalview.renderer.OverviewResColourFinderTest.testGetResidueBoxColour_userdef	1PASS
0.010519802	jalview.renderer.ResidueColourFinderTest.testGetResidueColour_nonejalview.renderer.ResidueColourFinderTest.testGetResidueColour_none	1PASS
0.010519802	jalview.gui.AlignFrameTest.testNewView_dsRefPreservedjalview.gui.AlignFrameTest.testNewView_dsRefPreserved	1PASS
0.010519802	jalview.util.MappingUtilsTest.testMapColumnSelection_dnaToProteinjalview.util.MappingUtilsTest.testMapColumnSelection_dnaToProtein	1PASS
0.010519802	jalview.analysis.FinderTest.testFindAll_sequenceIdsjalview.analysis.FinderTest.testFindAll_sequenceIds	1PASS
0.010519802	jalview.io.FeaturesFileTest.testParse_jalviewFeaturesOnlyjalview.io.FeaturesFileTest.testParse_jalviewFeaturesOnly	1PASS
0.010519802	jalview.analysis.FinderTest.testFind_inDescriptionjalview.analysis.FinderTest.testFind_inDescription	1PASS
0.010519802	jalview.ws2.actions.alignment.AlignmentActionTest.submitSequences_verifySequenceNamesUniquifiedjalview.ws2.actions.alignment.AlignmentActionTest.submitSequences_verifySequenceNamesUniquified	1PASS
0.010519802	jalview.gui.SeqPanelTest.testFindMousePosition_wrapped_noAnnotationsjalview.gui.SeqPanelTest.testFindMousePosition_wrapped_noAnnotations	1PASS
0.011138614	jalview.datamodel.PAEContactMatrixTest.testSeqAssociatedPAEMatrixjalview.datamodel.PAEContactMatrixTest.testSeqAssociatedPAEMatrix	1PASS
0.010519802	jalview.gui.SeqPanelTest.testFindColumn_and_FindAlignmentColumn_wrappedjalview.gui.SeqPanelTest.testFindColumn_and_FindAlignmentColumn_wrapped	1PASS
0.010519802	jalview.renderer.ResidueColourFinderTest.testGetResidueColour_userdefjalview.renderer.ResidueColourFinderTest.testGetResidueColour_userdef	1PASS
0.010519802	jalview.gui.PaintRefresherTest.testGetAssociatedPanelsjalview.gui.PaintRefresherTest.testGetAssociatedPanels	1PASS
0.010519802	jalview.gui.QuitHandlerTest.testInstantQuitjalview.gui.QuitHandlerTest.testInstantQuit	1PASS
0.011138614	jalview.analysis.AlignmentUtilsTests.testIsSSAnnotationPresentjalview.analysis.AlignmentUtilsTests.testIsSSAnnotationPresent	1PASS
0.010519802	jalview.util.MappingUtilsTest.testMapSequenceGroup_regionjalview.util.MappingUtilsTest.testMapSequenceGroup_region	1PASS
0.010519802	jalview.ws2.actions.alignment.AlignmentActionListenerNotifiedTest.submitSequences_verifySequenceNamesUniquifiedjalview.ws2.actions.alignment.AlignmentActionListenerNotifiedTest.submitSequences_verifySequenceNamesUniquified	1PASS
0.00990099	jalview.analysis.AlignmentUtilsTests.testIsSSAnnotationPresentjalview.analysis.AlignmentUtilsTests.testIsSSAnnotationPresent	1PASS
0.010519802	jalview.analysis.DnaTest.testReverseCdnajalview.analysis.DnaTest.testReverseCdna	1PASS
0.010519802	jalview.io.FeaturesFileTest.testPrintGffFormat_withFiltersjalview.io.FeaturesFileTest.testPrintGffFormat_withFilters	1PASS
0.010519802	jalview.util.MappingUtilsTest.testMapSequenceGroup_sequencesjalview.util.MappingUtilsTest.testMapSequenceGroup_sequences	1PASS
0.010519802	jalview.util.MappingUtilsTest.testMapColumnSelection_hiddenColumnsjalview.util.MappingUtilsTest.testMapColumnSelection_hiddenColumns	1PASS
0.010519802	jalview.ws2.actions.alignment.AlignmentActionTest.submitSequences_submitGapsOn_verifySequencesSubmittedWithGapsjalview.ws2.actions.alignment.AlignmentActionTest.submitSequences_submitGapsOn_verifySequencesSubmittedWithGaps	1PASS
0.010519802	jalview.util.MappingUtilsTest.testMapColumnSelection_proteinToDnajalview.util.MappingUtilsTest.testMapColumnSelection_proteinToDna	1PASS
0.010519802	jalview.gui.SeqPanelTest.testFindMousePosition_wrapped_scaleAbovejalview.gui.SeqPanelTest.testFindMousePosition_wrapped_scaleAbove	1PASS
0.010519802	jalview.io.WindowsFileLoadAndSaveTest.loadAndSaveAlignmentjalview.io.WindowsFileLoadAndSaveTest.loadAndSaveAlignment	1PASS
0.008044555	jalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSourcesjalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSources	1PASS
0.008663367	jalview.analysis.AlignmentUtilsTests.testTransferGeneLocijalview.analysis.AlignmentUtilsTests.testTransferGeneLoci	1PASS
0.009282178	jalview.datamodel.SequenceGroupTest.testHasSecondaryStructureAnnotationjalview.datamodel.SequenceGroupTest.testHasSecondaryStructureAnnotation	1PASS
0.0068069305	jalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_noReferenceAnnotationsjalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_noReferenceAnnotations	1PASS
0.0068069305	jalview.analysis.AnnotationSorterTest.testNoSort_autocalcFirstjalview.analysis.AnnotationSorterTest.testNoSort_autocalcFirst	1PASS
0.0068069305	jalview.io.BSMLFileTest.testParse_BSMLjalview.io.BSMLFileTest.testParse_BSML	1PASS
0.0074257427	jalview.analysis.AlignmentUtilsTests.testShowOrHideSequenceAnnotationsjalview.analysis.AlignmentUtilsTests.testShowOrHideSequenceAnnotations	1PASS
0.008044555	jalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSourcesjalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSources	1PASS
0.008044555	jalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSourcesjalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSources	1PASS
0.008044555	jalview.datamodel.AlignmentTest.testIsSecondaryStructurePresentjalview.datamodel.AlignmentTest.testIsSecondaryStructurePresent	1PASS
0.008663367	jalview.analysis.AlignmentUtilsTests.testGetSequencesByNamejalview.analysis.AlignmentUtilsTests.testGetSequencesByName	1PASS
0.0068069305	jalview.analysis.AnnotationSorterTest.testSortByTypeAndSequence_autocalcFirstjalview.analysis.AnnotationSorterTest.testSortByTypeAndSequence_autocalcFirst	1PASS
0.0068069305	jalview.analysis.AnnotationSorterTest.testSort_timingPresortedjalview.analysis.AnnotationSorterTest.testSort_timingPresorted	1PASS
0.0068069305	jalview.gui.AnnotationColumnChooserTest.testResetjalview.gui.AnnotationColumnChooserTest.testReset	1PASS
0.0068069305	jalview.analysis.AnnotationSorterTest.testSort_timingSemisortedjalview.analysis.AnnotationSorterTest.testSort_timingSemisorted	1PASS
0.0068069305	jalview.analysis.AnnotationSorterTest.testSortBySequenceAndType_autocalcFirstjalview.analysis.AnnotationSorterTest.testSortBySequenceAndType_autocalcFirst	1PASS
0.0068069305	jalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSourcesjalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSources	1PASS
0.0068069305	jalview.analysis.AnnotationSorterTest.testSortBySequenceAndType_autocalcLastjalview.analysis.AnnotationSorterTest.testSortBySequenceAndType_autocalcLast	1PASS
0.0068069305	jalview.analysis.AnnotationSorterTest.testSortByTypeAndSequence_autocalcLastjalview.analysis.AnnotationSorterTest.testSortByTypeAndSequence_autocalcLast	1PASS
0.0068069305	jalview.analysis.AnnotationSorterTest.testSort_timingUnsortedjalview.analysis.AnnotationSorterTest.testSort_timingUnsorted	1PASS
0.005569307	jalview.analysis.scoremodels.PIDModelTest.testComputePID_matchLongestSequencejalview.analysis.scoremodels.PIDModelTest.testComputePID_matchLongestSequence	1PASS
0.005569307	jalview.analysis.GroupingTest.testMakeGroupsWithBothjalview.analysis.GroupingTest.testMakeGroupsWithBoth	1PASS
0.004950495	jalview.analysis.AlignmentUtilsTests.testSecondaryStructureAnnotationColourjalview.analysis.AlignmentUtilsTests.testSecondaryStructureAnnotationColour	1PASS
0.004950495	jalview.analysis.AlignmentUtilsTests.testSecondaryStructureAnnotationColourjalview.analysis.AlignmentUtilsTests.testSecondaryStructureAnnotationColour	1PASS
0.0030940594	jalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSourcesjalview.analysis.AlignmentUtilsTests.testSecondaryStructurePresentAndSources	1PASS
0.0037128713	jalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_noSequenceSelectedjalview.gui.PopupMenuTest.testConfigureReferenceAnnotationsMenu_noSequenceSelected	1PASS
0.0037128713	jalview.analysis.AlignmentUtilsTests.testSecondaryStructureAnnotationColourjalview.analysis.AlignmentUtilsTests.testSecondaryStructureAnnotationColour	1PASS
0.0024752475	jalview.analysis.DnaTest.testTranslateCdna_hiddenColumnsjalview.analysis.DnaTest.testTranslateCdna_hiddenColumns	1PASS
0.0024752475	jalview.analysis.AlignmentUtilsTests.testSecondaryStructureAnnotationColourjalview.analysis.AlignmentUtilsTests.testSecondaryStructureAnnotationColour	1PASS
0.0024752475	jalview.analysis.DnaTest.testTranslateCdna_withUntranslatableCodonsjalview.analysis.DnaTest.testTranslateCdna_withUntranslatableCodons	1PASS
0.0024752475	jalview.analysis.DnaTest.testTranslateCdna_simplejalview.analysis.DnaTest.testTranslateCdna_simple	1PASS
0.0024752475	jalview.analysis.DnaTest.testTranslateCdna_sequenceOrderIndependentjalview.analysis.DnaTest.testTranslateCdna_sequenceOrderIndependent	1PASS
0.0018564357	jalview.analysis.AlignmentUtilsTests.testIsSSAnnotationPresentjalview.analysis.AlignmentUtilsTests.testIsSSAnnotationPresent	1PASS

Source view

/*
 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
 * Copyright (C) $$Year-Rel$$ The Jalview Authors
 *
 * This file is part of Jalview.
 *
 * Jalview is free software: you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation, either version 3
 * of the License, or (at your option) any later version.
 *
 * Jalview is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty
 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
 * PURPOSE. See the GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
 * The Jalview Authors are detailed in the 'AUTHORS' file.
 */

package jalview.analysis;

import java.awt.Color;

import java.util.ArrayList;

import java.util.Arrays;

import java.util.Collection;

import java.util.Collections;

import java.util.HashMap;

import java.util.HashSet;

import java.util.Iterator;

import java.util.LinkedHashMap;

import java.util.List;

import java.util.Locale;

import java.util.Map;

import java.util.Map.Entry;

import java.util.NoSuchElementException;

import java.util.Set;

import java.util.SortedMap;

import java.util.TreeMap;

import java.util.Vector;

import java.util.stream.Collectors;

import jalview.bin.Console;

import jalview.commands.RemoveGapColCommand;

import jalview.datamodel.AlignedCodon;

import jalview.datamodel.AlignedCodonFrame;

import jalview.datamodel.AlignedCodonFrame.SequenceToSequenceMapping;

import jalview.datamodel.Alignment;

import jalview.datamodel.AlignmentAnnotation;

import jalview.datamodel.AlignmentI;

import jalview.datamodel.Annotation;

import jalview.datamodel.ContactMatrixI;

import jalview.datamodel.DBRefEntry;

import jalview.datamodel.DBRefSource;

import jalview.datamodel.GeneLociI;

import jalview.datamodel.HiddenColumns;

import jalview.datamodel.IncompleteCodonException;

import jalview.datamodel.Mapping;

import jalview.datamodel.PDBEntry;

import jalview.datamodel.Sequence;

import jalview.datamodel.SequenceFeature;

import jalview.datamodel.SequenceGroup;

import jalview.datamodel.SequenceI;

import jalview.datamodel.features.SequenceFeatures;

import jalview.io.gff.SequenceOntologyI;

import jalview.schemes.ResidueProperties;

import jalview.util.ColorUtils;

import jalview.util.Comparison;

import jalview.util.Constants;

import jalview.util.DBRefUtils;

import jalview.util.IntRangeComparator;

import jalview.util.MapList;

import jalview.util.MappingUtils;

import jalview.util.ShiftList;

import uk.ac.vamsas.objects.core.descriptors.NewickDescriptor;

/**
 * Grab bag of useful alignment manipulation operations. Expect these to be
 * refactored elsewhere at some point.
 *
 * @author jimp
 */

public class AlignmentUtils

{

private static final int CODON_LENGTH = 3;

private static final String SEQUENCE_VARIANT = "sequence_variant:";

/*
 * the 'id' attribute is provided for variant features fetched from
 * Ensembl using its REST service with JSON format
 */

public static final String VARIANT_ID = "id";

/**

* A data model to hold the 'normal' base value at a position, and an optional

* sequence variant feature

100

static final class DnaVariant

{

final String base;

SequenceFeature variant;

105

106

DnaVariant(String nuc)

{

base = nuc;

variant = null;

}

DnaVariant(String nuc, SequenceFeature var)

{

base = nuc;

variant = var;

}

public String getSource()

119

{

120

return variant == null ? null : variant.getFeatureGroup();

}

/**

* toString for aid in the debugger only

125

126

@Override

127

public String toString()

128

{

129

return base + ":" + (variant == null ? "" : variant.getDescription());

}

}

/**

* given an existing alignment, create a new alignment including all, or up to

135

* flankSize additional symbols from each sequence's dataset sequence

* @param core

* @param flankSize

* @return AlignmentI

public static AlignmentI expandContext(AlignmentI core, int flankSize)

142

{

143

List<SequenceI> sq = new ArrayList<>();

144

int maxoffset = 0;

145

for (SequenceI s : core.getSequences())

146

{

147

131

SequenceI newSeq = s.deriveSequence();

148

131

final int newSeqStart = newSeq.getStart() - 1;

149

131

if (newSeqStart > maxoffset

150

&& newSeq.getDatasetSequence().getStart() < s.getStart())

151

{

152

131

maxoffset = newSeqStart;

153

}

154

131

sq.add(newSeq);

}

if (flankSize > -1)

{

maxoffset = Math.min(maxoffset, flankSize);

}

* now add offset left and right to create an expanded alignment

163

164

for (SequenceI s : sq)

165

{

166

131

SequenceI ds = s;

167

262

while (ds.getDatasetSequence() != null)

168

{

169

131

ds = ds.getDatasetSequence();

170

}

171

131

int s_end = s.findPosition(s.getStart() + s.getLength());

172

// find available flanking residues for sequence

173

131

int ustream_ds = s.getStart() - ds.getStart();

174

131

int dstream_ds = ds.getEnd() - s_end;

175

176

// build new flanked sequence

177

178

// compute gap padding to start of flanking sequence

179

131

int offset = maxoffset - ustream_ds;

180

181

// padding is gapChar x ( maxoffset - min(ustream_ds, flank)

182

131

if (flankSize >= 0)

183

{

184

125

if (flankSize < ustream_ds)

185

{

186

// take up to flankSize residues

187

offset = maxoffset - flankSize;

188

ustream_ds = flankSize;

189

}

190

125

if (flankSize <= dstream_ds)

191

{

192

116

dstream_ds = flankSize - 1;

193

}

194

}

195

// TODO use Character.toLowerCase to avoid creating String objects?

196

131

char[] upstream = new String(ds

197

.getSequence(s.getStart() - 1 - ustream_ds, s.getStart() - 1))

198

.toLowerCase(Locale.ROOT).toCharArray();

199

131

char[] downstream = new String(

200

ds.getSequence(s_end - 1, s_end + dstream_ds))

201

.toLowerCase(Locale.ROOT).toCharArray();

202

131

char[] coreseq = s.getSequence();

203

131

char[] nseq = new char[offset + upstream.length + downstream.length

204

+ coreseq.length];

205

131

char c = core.getGapCharacter();

206

207

131

int p = 0;

208

461

for (; p < offset; p++)

209

{

210

330

nseq[p] = c;

211

}

212

213

131

System.arraycopy(upstream, 0, nseq, p, upstream.length);

214

131

System.arraycopy(coreseq, 0, nseq, p + upstream.length,

215

coreseq.length);

216

131

System.arraycopy(downstream, 0, nseq,

217

p + coreseq.length + upstream.length, downstream.length);

218

131

s.setSequence(new String(nseq));

219

131

s.setStart(s.getStart() - ustream_ds);

220

131

s.setEnd(s_end + downstream.length);

221

}

222

AlignmentI newAl = new jalview.datamodel.Alignment(

223

sq.toArray(new SequenceI[0]));

224

for (SequenceI s : sq)

225

{

226

131

if (s.getAnnotation() != null)

227

{

228

for (AlignmentAnnotation aa : s.getAnnotation())

229

{

230

aa.adjustForAlignment(); // JAL-1712 fix

231

newAl.addAnnotation(aa);

}

}

}

newAl.setDataset(core.getDataset());

return newAl;

}

/**

* Returns the index (zero-based position) of a sequence in an alignment, or

* -1 if not found.

* @param al

* @param seq

* @return

64304

public static int getSequenceIndex(AlignmentI al, SequenceI seq)

248

{

249

64304

int result = -1;

250

64304

int pos = 0;

251

64304

for (SequenceI alSeq : al.getSequences())

252

{

253

126221607

if (alSeq == seq)

254

{

255

64241

result = pos;

256

64241

break;

257

}

258

126157362

pos++;

259

}

260

64302

return result;

}

/**

* Returns a map of lists of sequences in the alignment, keyed by sequence

265

* name. For use in mapping between different alignment views of the same

266

* sequences.

267

268

* @see jalview.datamodel.AlignmentI#getSequencesByName()

269

270

public static Map<String, List<SequenceI>> getSequencesByName(

271

AlignmentI al)

272

{

273

Map<String, List<SequenceI>> theMap = new LinkedHashMap<>();

274

for (SequenceI seq : al.getSequences())

275

{

276

String name = seq.getName();

277

if (name != null)

278

{

279

List<SequenceI> seqs = theMap.get(name);

280

if (seqs == null)

281

{

282

seqs = new ArrayList<>();

283

theMap.put(name, seqs);

}

seqs.add(seq);

}

}

return theMap;

}

/**

* Build mapping of protein to cDNA alignment. Mappings are made between

293

* sequences where the cDNA translates to the protein sequence. Any new

294

* mappings are added to the protein alignment. Returns true if any mappings

295

* either already exist or were added, else false.

296

297

* @param proteinAlignment

298

* @param cdnaAlignment

299

* @return

300

301

public static boolean mapProteinAlignmentToCdna(

302

final AlignmentI proteinAlignment, final AlignmentI cdnaAlignment)

303

{

304

if (proteinAlignment == null || cdnaAlignment == null)

{

return false;

}

Set<SequenceI> mappedDna = new HashSet<>();

310

Set<SequenceI> mappedProtein = new HashSet<>();

311

312

313

* First pass - map sequences where cross-references exist. This include

314

* 1-to-many mappings to support, for example, variant cDNA.

315

316

boolean mappingPerformed = mapProteinToCdna(proteinAlignment,

317

cdnaAlignment, mappedDna, mappedProtein, true);

318

319

320

* Second pass - map sequences where no cross-references exist. This only

321

* does 1-to-1 mappings and assumes corresponding sequences are in the same

322

* order in the alignments.

323

324

mappingPerformed |= mapProteinToCdna(proteinAlignment, cdnaAlignment,

325

mappedDna, mappedProtein, false);

326

return mappingPerformed;

}

/**

* Make mappings between compatible sequences (where the cDNA translation

331

* matches the protein).

332

333

* @param proteinAlignment

334

* @param cdnaAlignment

335

* @param mappedDna

336

* a set of mapped DNA sequences (to add to)

337

* @param mappedProtein

338

* a set of mapped Protein sequences (to add to)

339

* @param xrefsOnly

340

* if true, only map sequences where xrefs exist

341

* @return

342

343

protected static boolean mapProteinToCdna(

344

final AlignmentI proteinAlignment, final AlignmentI cdnaAlignment,

345

Set<SequenceI> mappedDna, Set<SequenceI> mappedProtein,

346

boolean xrefsOnly)

347

{

348

boolean mappingExistsOrAdded = false;

349

List<SequenceI> thisSeqs = proteinAlignment.getSequences();

350

for (SequenceI aaSeq : thisSeqs)

351

{

352

boolean proteinMapped = false;

353

AlignedCodonFrame acf = new AlignedCodonFrame();

354

355

for (SequenceI cdnaSeq : cdnaAlignment.getSequences())

356

{

357

358

* Always try to map if sequences have xref to each other; this supports

359

* variant cDNA or alternative splicing for a protein sequence.

360

361

* If no xrefs, try to map progressively, assuming that alignments have

362

* mappable sequences in corresponding order. These are not

363

* many-to-many, as that would risk mixing species with similar cDNA

364

* sequences.

365

366

if (xrefsOnly && !AlignmentUtils.haveCrossRef(aaSeq, cdnaSeq))

{

continue;

}

* Don't map non-xrefd sequences more than once each. This heuristic

373

* allows us to pair up similar sequences in ordered alignments.

374

375

if (!xrefsOnly && (mappedProtein.contains(aaSeq)

376

|| mappedDna.contains(cdnaSeq)))

{

continue;

}

if (mappingExists(proteinAlignment.getCodonFrames(),

381

aaSeq.getDatasetSequence(), cdnaSeq.getDatasetSequence()))

382

{

383

mappingExistsOrAdded = true;

}

else

{

MapList map = mapCdnaToProtein(aaSeq, cdnaSeq);

388

if (map != null)

389

{

390

acf.addMap(cdnaSeq, aaSeq, map);

391

mappingExistsOrAdded = true;

392

proteinMapped = true;

393

mappedDna.add(cdnaSeq);

394

mappedProtein.add(aaSeq);

}

}

}

if (proteinMapped)

{

proteinAlignment.addCodonFrame(acf);

401

}

402

}

403

return mappingExistsOrAdded;

}

/**

* Answers true if the mappings include one between the given (dataset)

408

* sequences.

409

410

protected static boolean mappingExists(List<AlignedCodonFrame> mappings,

411

SequenceI aaSeq, SequenceI cdnaSeq)

412

{

413

if (mappings != null)

414

{

415

for (AlignedCodonFrame acf : mappings)

416

{

417

if (cdnaSeq == acf.getDnaForAaSeq(aaSeq))

{

return true;

}

}

}

return false;

}

/**

* Builds a mapping (if possible) of a cDNA to a protein sequence.

428

* <ul>

429

* <li>first checks if the cdna translates exactly to the protein

430

* sequence</li>

431

* <li>else checks for translation after removing a STOP codon</li>

432

* <li>else checks for translation after removing a START codon</li>

433

* <li>if that fails, inspect CDS features on the cDNA sequence</li>

434

* </ul>

435

* Returns null if no mapping is determined.

436

437

* @param proteinSeq

438

* the aligned protein sequence

439

* @param cdnaSeq

440

* the aligned cdna sequence

441

* @return

442

443

public static MapList mapCdnaToProtein(SequenceI proteinSeq,

SequenceI cdnaSeq)

{

* Here we handle either dataset sequence set (desktop) or absent (applet).

448

* Use only the char[] form of the sequence to avoid creating possibly large

449

* String objects.

450

451

final SequenceI proteinDataset = proteinSeq.getDatasetSequence();

452

char[] aaSeqChars = proteinDataset != null

453

? proteinDataset.getSequence()

454

: proteinSeq.getSequence();

455

final SequenceI cdnaDataset = cdnaSeq.getDatasetSequence();

456

char[] cdnaSeqChars = cdnaDataset != null ? cdnaDataset.getSequence()

457

: cdnaSeq.getSequence();

458

if (aaSeqChars == null || cdnaSeqChars == null)

{

return null;

}

* cdnaStart/End, proteinStartEnd are base 1 (for dataset sequence mapping)

465

466

final int mappedLength = CODON_LENGTH * aaSeqChars.length;

467

int cdnaLength = cdnaSeqChars.length;

468

int cdnaStart = cdnaSeq.getStart();

469

int cdnaEnd = cdnaSeq.getEnd();

470

final int proteinStart = proteinSeq.getStart();

471

final int proteinEnd = proteinSeq.getEnd();

472

473

474

* If lengths don't match, try ignoring stop codon (if present)

475

476

if (cdnaLength != mappedLength && cdnaLength > 2)

477

{

478

String lastCodon = String.valueOf(cdnaSeqChars,

479

cdnaLength - CODON_LENGTH, CODON_LENGTH)

480

.toUpperCase(Locale.ROOT);

481

for (String stop : ResidueProperties.STOP_CODONS)

482

{

483

if (lastCodon.equals(stop))

484

{

485

cdnaEnd -= CODON_LENGTH;

486

cdnaLength -= CODON_LENGTH;

break;

}

}

}

* If lengths still don't match, try ignoring start codon.

494

495

int startOffset = 0;

496

if (cdnaLength != mappedLength && cdnaLength > 2

497

&& String.valueOf(cdnaSeqChars, 0, CODON_LENGTH)

498

.toUpperCase(Locale.ROOT)

499

.equals(ResidueProperties.START))

500

{

501

startOffset += CODON_LENGTH;

502

cdnaStart += CODON_LENGTH;

503

cdnaLength -= CODON_LENGTH;

504

}

505

506

if (translatesAs(cdnaSeqChars, startOffset, aaSeqChars))

507

{

508

509

* protein is translation of dna (+/- start/stop codons)

510

511

MapList map = new MapList(new int[] { cdnaStart, cdnaEnd },

512

new int[]

513

{ proteinStart, proteinEnd }, CODON_LENGTH, 1);

return map;

}

* translation failed - try mapping CDS annotated regions of dna

519

520

return mapCdsToProtein(cdnaSeq, proteinSeq);

}

/**

* Test whether the given cdna sequence, starting at the given offset,

525

* translates to the given amino acid sequence, using the standard translation

526

* table. Designed to fail fast i.e. as soon as a mismatch position is found.

527

528

* @param cdnaSeqChars

* @param cdnaStart

* @param aaSeqChars

* @return

protected static boolean translatesAs(char[] cdnaSeqChars, int cdnaStart,

534

char[] aaSeqChars)

535

{

536

if (cdnaSeqChars == null || aaSeqChars == null)

{

return false;

}

int aaPos = 0;

int dnaPos = cdnaStart;

543

162

for (; dnaPos < cdnaSeqChars.length - 2

544

&& aaPos < aaSeqChars.length; dnaPos += CODON_LENGTH, aaPos++)

545

{

546

131

String codon = String.valueOf(cdnaSeqChars, dnaPos, CODON_LENGTH);

547

131

final String translated = ResidueProperties.codonTranslate(codon);

548

549

550

* allow * in protein to match untranslatable in dna

551

552

131

final char aaRes = aaSeqChars[aaPos];

553

131

if ((translated == null || ResidueProperties.STOP.equals(translated))

&& aaRes == '*')

{

continue;

}

127

if (translated == null || !(aaRes == translated.charAt(0)))

559

{

560

// debug

561

// jalview.bin.Console.outPrintln(("Mismatch at " + i + "/" + aaResidue

562

// + ": "

563

// + codon + "(" + translated + ") != " + aaRes));

return false;

}

}

* check we matched all of the protein sequence

570

571

if (aaPos != aaSeqChars.length)

{

return false;

}

* check we matched all of the dna except

578

* for optional trailing STOP codon

579

580

if (dnaPos == cdnaSeqChars.length)

{

return true;

}

if (dnaPos == cdnaSeqChars.length - CODON_LENGTH)

585

{

586

String codon = String.valueOf(cdnaSeqChars, dnaPos, CODON_LENGTH);

587

if (ResidueProperties.STOP

588

.equals(ResidueProperties.codonTranslate(codon)))

{

return true;

}

}

return false;

}

/**

* Align sequence 'seq' to match the alignment of a mapped sequence. Note this

598

* currently assumes that we are aligning cDNA to match protein.

599

600

* @param seq

601

* the sequence to be realigned

602

* @param al

603

* the alignment whose sequence alignment is to be 'copied'

604

* @param gap

605

* character string represent a gap in the realigned sequence

606

* @param preserveUnmappedGaps

607

* @param preserveMappedGaps

608

* @return true if the sequence was realigned, false if it could not be

609

610

public static boolean alignSequenceAs(SequenceI seq, AlignmentI al,

611

String gap, boolean preserveMappedGaps,

612

boolean preserveUnmappedGaps)

613

{

614

615

* Get any mappings from the source alignment to the target (dataset)

616

* sequence.

617

618

// TODO there may be one AlignedCodonFrame per dataset sequence, or one with

619

// all mappings. Would it help to constrain this?

620

List<AlignedCodonFrame> mappings = al.getCodonFrame(seq);

621

if (mappings == null || mappings.isEmpty())

{

return false;

}

* Locate the aligned source sequence whose dataset sequence is mapped. We

628

* just take the first match here (as we can't align like more than one

629

* sequence).

630

631

SequenceI alignFrom = null;

632

AlignedCodonFrame mapping = null;

633

for (AlignedCodonFrame mp : mappings)

634

{

635

alignFrom = mp.findAlignedSequence(seq, al);

636

if (alignFrom != null)

{

mapping = mp;

break;

}

}

if (alignFrom == null)

{

return false;

}

alignSequenceAs(seq, alignFrom, mapping, gap, al.getGapCharacter(),

648

preserveMappedGaps, preserveUnmappedGaps);

return true;

}

/**

* Align sequence 'alignTo' the same way as 'alignFrom', using the mapping to

654

* match residues and codons. Flags control whether existing gaps in unmapped

655

* (intron) and mapped (exon) regions are preserved or not. Gaps between

656

* intron and exon are only retained if both flags are set.

* @param alignTo

* @param alignFrom

* @param mapping

* @param myGap

* @param sourceGap

* @param preserveUnmappedGaps

664

* @param preserveMappedGaps

665

666

public static void alignSequenceAs(SequenceI alignTo, SequenceI alignFrom,

667

AlignedCodonFrame mapping, String myGap, char sourceGap,

668

boolean preserveMappedGaps, boolean preserveUnmappedGaps)

669

{

670

// TODO generalise to work for Protein-Protein, dna-dna, dna-protein

671

672

// aligned and dataset sequence positions, all base zero

int thisSeqPos = 0;

int sourceDsPos = 0;

int basesWritten = 0;

677

char myGapChar = myGap.charAt(0);

678

int ratio = myGap.length();

679

680

int fromOffset = alignFrom.getStart() - 1;

681

int toOffset = alignTo.getStart() - 1;

682

int sourceGapMappedLength = 0;

683

boolean inExon = false;

684

final int toLength = alignTo.getLength();

685

final int fromLength = alignFrom.getLength();

686

StringBuilder thisAligned = new StringBuilder(2 * toLength);

687

688

689

* Traverse the 'model' aligned sequence

690

691

205

for (int i = 0; i < fromLength; i++)

692

{

693

186

char sourceChar = alignFrom.getCharAt(i);

694

186

if (sourceChar == sourceGap)

695

{

696

sourceGapMappedLength += ratio;

continue;

}

* Found a non-gap character. Locate its mapped region if any.

702

703

142

sourceDsPos++;

704

// Note mapping positions are base 1, our sequence positions base 0

705

142

int[] mappedPos = mapping.getMappedRegion(alignTo, alignFrom,

706

sourceDsPos + fromOffset);

707

142

if (mappedPos == null)

708

{

709

710

* unmapped position; treat like a gap

711

712

sourceGapMappedLength += ratio;

713

// jalview.bin.Console.errPrintln("Can't align: no codon mapping to

714

// residue "

715

// + sourceDsPos + "(" + sourceChar + ")");

// return;

continue;

}

int mappedCodonStart = mappedPos[0]; // position (1...) of codon start

721

int mappedCodonEnd = mappedPos[mappedPos.length - 1]; // codon end pos

722

StringBuilder trailingCopiedGap = new StringBuilder();

723

724

725

* Copy dna sequence up to and including this codon. Optionally, include

726

* gaps before the codon starts (in introns) and/or after the codon starts

727

* (in exons).

728

729

* Note this only works for 'linear' splicing, not reverse or interleaved.

730

* But then 'align dna as protein' doesn't make much sense otherwise.

731

732

int intronLength = 0;

733

294

while (basesWritten + toOffset < mappedCodonEnd

734

&& thisSeqPos < toLength)

735

{

736

246

final char c = alignTo.getCharAt(thisSeqPos++);

737

246

if (c != myGapChar)

738

{

739

146

basesWritten++;

740

146

int sourcePosition = basesWritten + toOffset;

741

146

if (sourcePosition < mappedCodonStart)

742

{

743

744

* Found an unmapped (intron) base. First add in any preceding gaps

745

* (if wanted).

746

747

if (preserveUnmappedGaps && trailingCopiedGap.length() > 0)

748

{

749

thisAligned.append(trailingCopiedGap.toString());

750

intronLength += trailingCopiedGap.length();

751

trailingCopiedGap = new StringBuilder();

}

intronLength++;

inExon = false;

}

else

{

final boolean startOfCodon = sourcePosition == mappedCodonStart;

759

int gapsToAdd = calculateGapsToInsert(preserveMappedGaps,

760

preserveUnmappedGaps, sourceGapMappedLength, inExon,

761

trailingCopiedGap.length(), intronLength, startOfCodon);

762

215

for (int k = 0; k < gapsToAdd; k++)

763

{

764

117

thisAligned.append(myGapChar);

765

}

766

sourceGapMappedLength = 0;

767

inExon = true;

768

}

769

146

thisAligned.append(c);

770

146

trailingCopiedGap = new StringBuilder();

}

else

{

100

if (inExon && preserveMappedGaps)

775

{

776

trailingCopiedGap.append(myGapChar);

777

}

778

else if (!inExon && preserveUnmappedGaps)

779

{

780

trailingCopiedGap.append(myGapChar);

}

}

}

}

* At end of model aligned sequence. Copy any remaining target sequence, optionally

788

* including (intron) gaps.

789

790

129

while (thisSeqPos < toLength)

791

{

792

110

final char c = alignTo.getCharAt(thisSeqPos++);

793

110

if (c != myGapChar || preserveUnmappedGaps)

794

{

795

102

thisAligned.append(c);

796

}

797

110

sourceGapMappedLength--;

}

* finally add gaps to pad for any trailing source gaps or

802

* unmapped characters

803

804

if (preserveUnmappedGaps)

805

{

806

while (sourceGapMappedLength > 0)

807

{

808

thisAligned.append(myGapChar);

809

sourceGapMappedLength--;

}

}

* All done aligning, set the aligned sequence.

815

816

alignTo.setSequence(new String(thisAligned));

}

/**

* Helper method to work out how many gaps to insert when realigning.

821

822

* @param preserveMappedGaps

823

* @param preserveUnmappedGaps

824

* @param sourceGapMappedLength

825

* @param inExon

826

* @param trailingCopiedGap

827

* @param intronLength

828

* @param startOfCodon

829

* @return

830

831

protected static int calculateGapsToInsert(boolean preserveMappedGaps,

832

boolean preserveUnmappedGaps, int sourceGapMappedLength,

833

boolean inExon, int trailingGapLength, int intronLength,

834

final boolean startOfCodon)

{

int gapsToAdd = 0;

if (startOfCodon)

{

* Reached start of codon. Ignore trailing gaps in intron unless we are

841

* preserving gaps in both exon and intron. Ignore them anyway if the

842

* protein alignment introduces a gap at least as large as the intronic

843

* region.

844

845

if (inExon && !preserveMappedGaps)

846

{

847

trailingGapLength = 0;

848

}

849

if (!inExon && !(preserveMappedGaps && preserveUnmappedGaps))

850

{

851

trailingGapLength = 0;

}

if (inExon)

{

gapsToAdd = Math.max(sourceGapMappedLength, trailingGapLength);

}

else

{

if (intronLength + trailingGapLength <= sourceGapMappedLength)

860

{

861

gapsToAdd = sourceGapMappedLength - intronLength;

}

else

{

gapsToAdd = Math.min(

866

intronLength + trailingGapLength - sourceGapMappedLength,

trailingGapLength);

}

}

}

else

{

* second or third base of codon; check for any gaps in dna

875

876

if (!preserveMappedGaps)

877

{

878

trailingGapLength = 0;

879

}

880

gapsToAdd = Math.max(sourceGapMappedLength, trailingGapLength);

}

return gapsToAdd;

}

/**

* Realigns the given protein to match the alignment of the dna, using codon

887

* mappings to translate aligned codon positions to protein residues.

888

889

* @param protein

890

* the alignment whose sequences are realigned by this method

891

* @param dna

892

* the dna alignment whose alignment we are 'copying'

893

* @return the number of sequences that were realigned

894

895

public static int alignProteinAsDna(AlignmentI protein, AlignmentI dna)

896

{

897

if (protein.isNucleotide() || !dna.isNucleotide())

898

{

899

jalview.bin.Console

900

.errPrintln("Wrong alignment type in alignProteinAsDna");

901

return 0;

902

}

903

List<SequenceI> unmappedProtein = new ArrayList<>();

904

Map<AlignedCodon, Map<SequenceI, AlignedCodon>> alignedCodons = buildCodonColumnsMap(

905

protein, dna, unmappedProtein);

906

return alignProteinAs(protein, alignedCodons, unmappedProtein);

}

/**

* Realigns the given dna to match the alignment of the protein, using codon

911

* mappings to translate aligned peptide positions to codons.

912

913

* Always produces a padded CDS alignment.

914

915

* @param dna

916

* the alignment whose sequences are realigned by this method

917

* @param protein

918

* the protein alignment whose alignment we are 'copying'

919

* @return the number of sequences that were realigned

920

921

public static int alignCdsAsProtein(AlignmentI dna, AlignmentI protein)

922

{

923

if (protein.isNucleotide() || !dna.isNucleotide())

924

{

925

jalview.bin.Console

926

.errPrintln("Wrong alignment type in alignProteinAsDna");

927

return 0;

928

}

929

// todo: implement this

930

List<AlignedCodonFrame> mappings = protein.getCodonFrames();

931

int alignedCount = 0;

932

int width = 0; // alignment width for padding CDS

933

for (SequenceI dnaSeq : dna.getSequences())

934

{

935

if (alignCdsSequenceAsProtein(dnaSeq, protein, mappings,

936

dna.getGapCharacter()))

{

alignedCount++;

}

width = Math.max(dnaSeq.getLength(), width);

}

int oldwidth;

int diff;

for (SequenceI dnaSeq : dna.getSequences())

945

{

946

oldwidth = dnaSeq.getLength();

947

diff = width - oldwidth;

948

if (diff > 0)

949

{

950

dnaSeq.insertCharAt(oldwidth, diff, dna.getGapCharacter());

}

}

return alignedCount;

}

/**

* Helper method to align (if possible) the dna sequence to match the

958

* alignment of a mapped protein sequence. This is currently limited to

959

* handling coding sequence only.

* @param cdsSeq

* @param protein

* @param mappings

* @param gapChar

* @return

static boolean alignCdsSequenceAsProtein(SequenceI cdsSeq,

968

AlignmentI protein, List<AlignedCodonFrame> mappings,

969

char gapChar)

970

{

971

SequenceI cdsDss = cdsSeq.getDatasetSequence();

if (cdsDss == null)

{

System.err

.println("alignCdsSequenceAsProtein needs aligned sequence!");

return false;

}

List<AlignedCodonFrame> dnaMappings = MappingUtils

980

.findMappingsForSequence(cdsSeq, mappings);

981

for (AlignedCodonFrame mapping : dnaMappings)

982

{

983

SequenceI peptide = mapping.findAlignedSequence(cdsSeq, protein);

984

if (peptide != null)

985

{

986

final int peptideLength = peptide.getLength();

987

Mapping map = mapping.getMappingBetween(cdsSeq, peptide);

988

if (map != null)

989

{

990

MapList mapList = map.getMap();

991

if (map.getTo() == peptide.getDatasetSequence())

992

{

993

mapList = mapList.getInverse();

994

}

995

final int cdsLength = cdsDss.getLength();

996

int mappedFromLength = MappingUtils

997

.getLength(mapList.getFromRanges());

998

int mappedToLength = MappingUtils

999

.getLength(mapList.getToRanges());

1000

boolean addStopCodon = (cdsLength == mappedFromLength

1001

* CODON_LENGTH + CODON_LENGTH)

1002

|| (peptide.getDatasetSequence()

1003

.getLength() == mappedFromLength - 1);

1004

if (cdsLength != mappedToLength && !addStopCodon)

1005

{

1006

jalview.bin.Console.errPrintln(String.format(

1007

"Can't align cds as protein (length mismatch %d/%d): %s",

1008

cdsLength, mappedToLength, cdsSeq.getName()));

}

* pre-fill the aligned cds sequence with gaps

1013

1014

char[] alignedCds = new char[peptideLength * CODON_LENGTH

1015

+ (addStopCodon ? CODON_LENGTH : 0)];

1016

Arrays.fill(alignedCds, gapChar);

1017

1018

1019

* walk over the aligned peptide sequence and insert mapped

1020

* codons for residues in the aligned cds sequence

1021

1022

int copiedBases = 0;

1023

int cdsStart = cdsDss.getStart();

1024

int proteinPos = peptide.getStart() - 1;

1025

int cdsCol = 0;

1026

1027

for (int col = 0; col < peptideLength; col++)

1028

{

1029

char residue = peptide.getCharAt(col);

1030

1031

if (Comparison.isGap(residue))

1032

{

1033

cdsCol += CODON_LENGTH;

}

else

{

proteinPos++;

int[] codon = mapList.locateInTo(proteinPos, proteinPos);

1039

if (codon == null)

1040

{

1041

// e.g. incomplete start codon, X in peptide

1042

cdsCol += CODON_LENGTH;

}

else

{

for (int j = codon[0]; j <= codon[1]; j++)

1047

{

1048

char mappedBase = cdsDss.getCharAt(j - cdsStart);

1049

alignedCds[cdsCol++] = mappedBase;

copiedBases++;

}

}

}

}

* append stop codon if not mapped from protein,

1058

* closing it up to the end of the mapped sequence

1059

1060

if (copiedBases == cdsLength - CODON_LENGTH)

1061

{

1062

for (int i = alignedCds.length - 1; i >= 0; i--)

1063

{

1064

if (!Comparison.isGap(alignedCds[i]))

1065

{

1066

cdsCol = i + 1; // gap just after end of sequence

break;

}

}

for (int i = cdsLength - CODON_LENGTH; i < cdsLength; i++)

1071

{

1072

alignedCds[cdsCol++] = cdsDss.getCharAt(i);

1073

}

1074

}

1075

cdsSeq.setSequence(new String(alignedCds));

return true;

}

}

}

return false;

}

/**

* Builds a map whose key is an aligned codon position (3 alignment column

1085

* numbers base 0), and whose value is a map from protein sequence to each

1086

* protein's peptide residue for that codon. The map generates an ordering of

1087

* the codons, and allows us to read off the peptides at each position in

1088

* order to assemble 'aligned' protein sequences.

1089

1090

* @param protein

1091

* the protein alignment

1092

* @param dna

1093

* the coding dna alignment

1094

* @param unmappedProtein

1095

* any unmapped proteins are added to this list

1096

* @return

1097

1098

protected static Map<AlignedCodon, Map<SequenceI, AlignedCodon>> buildCodonColumnsMap(

1099

AlignmentI protein, AlignmentI dna,

1100

List<SequenceI> unmappedProtein)

1101

{

1102

1103

* maintain a list of any proteins with no mappings - these will be

1104

* rendered 'as is' in the protein alignment as we can't align them

1105

1106

unmappedProtein.addAll(protein.getSequences());

1107

1108

List<AlignedCodonFrame> mappings = protein.getCodonFrames();

1109

1110

1111

* Map will hold, for each aligned codon position e.g. [3, 5, 6], a map of

1112

* {dnaSequence, {proteinSequence, codonProduct}} at that position. The

1113

* comparator keeps the codon positions ordered.

1114

1115

Map<AlignedCodon, Map<SequenceI, AlignedCodon>> alignedCodons = new TreeMap<>(

1116

new CodonComparator());

1117

1118

for (SequenceI dnaSeq : dna.getSequences())

1119

{

1120

for (AlignedCodonFrame mapping : mappings)

1121

{

1122

516

SequenceI prot = mapping.findAlignedSequence(dnaSeq, protein);

1123

516

if (prot != null)

1124

{

1125

Mapping seqMap = mapping.getMappingForSequence(dnaSeq);

1126

addCodonPositions(dnaSeq, prot, protein.getGapCharacter(), seqMap,

1127

alignedCodons);

1128

unmappedProtein.remove(prot);

}

}

}

* Finally add any unmapped peptide start residues (e.g. for incomplete

1135

* codons) as if at the codon position before the second residue

1136

1137

// TODO resolve JAL-2022 so this fudge can be removed

1138

int mappedSequenceCount = protein.getHeight() - unmappedProtein.size();

1139

addUnmappedPeptideStarts(alignedCodons, mappedSequenceCount);

1140

1141

return alignedCodons;

}

/**

* Scans for any protein mapped from position 2 (meaning unmapped start

1146

* position e.g. an incomplete codon), and synthesizes a 'codon' for it at the

1147

* preceding position in the alignment

1148

1149

* @param alignedCodons

1150

* the codon-to-peptide map

1151

* @param mappedSequenceCount

1152

* the number of distinct sequences in the map

1153

1154

protected static void addUnmappedPeptideStarts(

1155

Map<AlignedCodon, Map<SequenceI, AlignedCodon>> alignedCodons,

1156

int mappedSequenceCount)

1157

{

1158

// TODO delete this ugly hack once JAL-2022 is resolved

1159

// i.e. we can model startPhase > 0 (incomplete start codon)

1160

1161

List<SequenceI> sequencesChecked = new ArrayList<>();

1162

AlignedCodon lastCodon = null;

1163

Map<SequenceI, AlignedCodon> toAdd = new HashMap<>();

1164

1165

for (Entry<AlignedCodon, Map<SequenceI, AlignedCodon>> entry : alignedCodons

1166

.entrySet())

1167

{

1168

1913

for (Entry<SequenceI, AlignedCodon> sequenceCodon : entry.getValue()

1169

.entrySet())

1170

{

1171

10670

SequenceI seq = sequenceCodon.getKey();

1172

10670

if (sequencesChecked.contains(seq))

1173

{

1174

10640

continue;

1175

}

1176

sequencesChecked.add(seq);

1177

AlignedCodon codon = sequenceCodon.getValue();

1178

if (codon.peptideCol > 1)

1179

{

1180

jalview.bin.Console.errPrintln(

1181

"Problem mapping protein with >1 unmapped start positions: "

1182

+ seq.getName());

1183

}

1184

else if (codon.peptideCol == 1)

1185

{

1186

1187

* first position (peptideCol == 0) was unmapped - add it

1188

1189

if (lastCodon != null)

1190

{

1191

AlignedCodon firstPeptide = new AlignedCodon(lastCodon.pos1,

1192

lastCodon.pos2, lastCodon.pos3,

1193

String.valueOf(seq.getCharAt(0)), 0);

1194

toAdd.put(seq, firstPeptide);

}

else

{

* unmapped residue at start of alignment (no prior column) -

1200

* 'insert' at nominal codon [0, 0, 0]

1201

1202

AlignedCodon firstPeptide = new AlignedCodon(0, 0, 0,

1203

String.valueOf(seq.getCharAt(0)), 0);

1204

toAdd.put(seq, firstPeptide);

1205

}

1206

}

1207

if (sequencesChecked.size() == mappedSequenceCount)

1208

{

1209

// no need to check past first mapped position in all sequences

break;

}

}

1913

lastCodon = entry.getKey();

}

* add any new codons safely after iterating over the map

1218

1219

for (Entry<SequenceI, AlignedCodon> startCodon : toAdd.entrySet())

1220

{

1221

addCodonToMap(alignedCodons, startCodon.getValue(),

1222

startCodon.getKey());

}

}

/**

* Update the aligned protein sequences to match the codon alignments given in

* the map.

* @param protein

* @param alignedCodons

1232

* an ordered map of codon positions (columns), with sequence/peptide

1233

* values present in each column

1234

* @param unmappedProtein

1235

* @return

1236

1237

protected static int alignProteinAs(AlignmentI protein,

1238

Map<AlignedCodon, Map<SequenceI, AlignedCodon>> alignedCodons,

1239

List<SequenceI> unmappedProtein)

1240

{

1241

1242

* prefill peptide sequences with gaps

1243

1244

int alignedWidth = alignedCodons.size();

1245

char[] gaps = new char[alignedWidth];

1246

Arrays.fill(gaps, protein.getGapCharacter());

1247

Map<SequenceI, char[]> peptides = new HashMap<>();

1248

for (SequenceI seq : protein.getSequences())

1249

{

1250

if (!unmappedProtein.contains(seq))

1251

{

1252

peptides.put(seq, Arrays.copyOf(gaps, gaps.length));

}

}

* Traverse the codons left to right (as defined by CodonComparator)

1258

* and insert peptides in each column where the sequence is mapped.

1259

* This gives a peptide 'alignment' where residues are aligned if their

1260

* corresponding codons occupy the same columns in the cdna alignment.

1261

1262

int column = 0;

1263

for (AlignedCodon codon : alignedCodons.keySet())

1264

{

1265

1914

final Map<SequenceI, AlignedCodon> columnResidues = alignedCodons

1266

.get(codon);

1267

1914

for (Entry<SequenceI, AlignedCodon> entry : columnResidues.entrySet())

1268

{

1269

10682

char residue = entry.getValue().product.charAt(0);

1270

10682

peptides.get(entry.getKey())[column] = residue;

1271

}

1272

1914

column++;

}

* and finally set the constructed sequences

1277

1278

for (Entry<SequenceI, char[]> entry : peptides.entrySet())

1279

{

1280

entry.getKey().setSequence(new String(entry.getValue()));

}

return 0;

}

/**

* Populate the map of aligned codons by traversing the given sequence

1288

* mapping, locating the aligned positions of mapped codons, and adding those

1289

* positions and their translation products to the map.

1290

1291

* @param dna

1292

* the aligned sequence we are mapping from

1293

* @param protein

1294

* the sequence to be aligned to the codons

1295

* @param gapChar

1296

* the gap character in the dna sequence

1297

* @param seqMap

1298

* a mapping to a sequence translation

1299

* @param alignedCodons

1300

* the map we are building up

1301

1302

static void addCodonPositions(SequenceI dna, SequenceI protein,

1303

char gapChar, Mapping seqMap,

1304

Map<AlignedCodon, Map<SequenceI, AlignedCodon>> alignedCodons)

1305

{

1306

Iterator<AlignedCodon> codons = seqMap.getCodonIterator(dna, gapChar);

1307

1308

1309

* add codon positions, and their peptide translations, to the alignment

1310

* map, while remembering the first codon mapped

1311

1312

10716

while (codons.hasNext())

1313

{

1314

10684

try

1315

{

1316

10684

AlignedCodon codon = codons.next();

1317

10684

addCodonToMap(alignedCodons, codon, protein);

1318

} catch (IncompleteCodonException e)

1319

{

1320

// possible incomplete trailing codon - ignore

1321

} catch (NoSuchElementException e)

1322

{

1323

// possibly peptide lacking STOP

}

}

}

/**

* Helper method to add a codon-to-peptide entry to the aligned codons map

1330

1331

* @param alignedCodons

* @param codon

* @param protein

10690

protected static void addCodonToMap(

1336

Map<AlignedCodon, Map<SequenceI, AlignedCodon>> alignedCodons,

1337

AlignedCodon codon, SequenceI protein)

1338

{

1339

10690

Map<SequenceI, AlignedCodon> seqProduct = alignedCodons.get(codon);

1340

10690

if (seqProduct == null)

1341

{

1342

1914

seqProduct = new HashMap<>();

1343

1914

alignedCodons.put(codon, seqProduct);

1344

}

1345

10690

seqProduct.put(protein, codon);

}

/**

* Returns true if a cDNA/Protein mapping either exists, or could be made,

1350

* between at least one pair of sequences in the two alignments. Currently,

1351

* the logic is:

1352

* <ul>

1353

* <li>One alignment must be nucleotide, and the other protein</li>

1354

* <li>At least one pair of sequences must be already mapped, or mappable</li>

1355

* <li>Mappable means the nucleotide translation matches the protein

1356

* sequence</li>

1357

* <li>The translation may ignore start and stop codons if present in the

* nucleotide</li>

* </ul>

* @param al1

* @param al2

* @return

public static boolean isMappable(AlignmentI al1, AlignmentI al2)

1366

{

1367

if (al1 == null || al2 == null || al1 == al2)

{

return false;

}

* Require one nucleotide and one protein

1374

1375

if (al1.isNucleotide() == al2.isNucleotide())

1376

{

1377

// or if protein - check if alternate coding

1378

if (al1.isNucleotide())

{

return false;

}

return check3diPeptideMapping(al1,al2);

1383

}

1384

AlignmentI dna = al1.isNucleotide() ? al1 : al2;

1385

AlignmentI protein = dna == al1 ? al2 : al1;

1386

List<AlignedCodonFrame> mappings = protein.getCodonFrames();

1387

for (SequenceI dnaSeq : dna.getSequences())

1388

{

1389

for (SequenceI proteinSeq : protein.getSequences())

1390

{

1391

if (isMappable(dnaSeq, proteinSeq, mappings))

{

return true;

}

}

}

return false;

}

public static boolean check3diPeptideMapping(AlignmentI al1, AlignmentI al2)

1400

{

1401

if (al1.getHeight()!=al2.getHeight())

{ return false;

}

int mappable=0;

for (SequenceI al1seq: al1.getSequences())

1406

{

1407

boolean foundMappable = false;

1408

for (SequenceI al2seq:al2.getSequences())

1409

{

1410

454

if (canBuild3diMapping(al1seq,al2seq))

1411

{

1412

foundMappable = true;

break;

}

}

if (foundMappable)

{

mappable++;

}

}

if (mappable>0 && mappable >= (al1.getHeight()*9/10))

1422

{

1423

// TODO allow optional if mappable > a few

return true;

}

return false;

}

/**

* exact name, start-end, and identical length non-gap sequences

* @param al1seq

* @param al2seq

* @return

466

public static boolean canBuild3diMapping(SequenceI al1seq,

1436

SequenceI al2seq)

1437

{

1438

466

if (!al1seq.getDisplayId(true)

1439

.equalsIgnoreCase(al2seq.getDisplayId(true))) {

1440

458

return false;

1441

}

1442

String s1 = AlignSeq

1443

.extractGaps(jalview.util.Comparison.GapChars,

1444

al1seq.getSequenceAsString());

1445

String s2 = AlignSeq.extractGaps(

1446

jalview.util.Comparison.GapChars,

1447

al2seq.getSequenceAsString());

1448

return s1.length()==s2.length();

1449

}

1450

1451

public static boolean map3diPeptideToProteinAligment(

1452

AlignmentI proteinAlignment, AlignmentI tdiAlignment)

1453

{

1454

if (proteinAlignment==null || tdiAlignment==null)

{

return false;

}

Set<SequenceI> mappedDna = new HashSet<>();

1459

Set<SequenceI> mappedProtein = new HashSet<>();

1460

1461

1462

* First pass - map sequences where cross-references exist. This include

1463

* 1-to-many mappings to support, for example, variant cDNA.

1464

1465

boolean mappingPerformed = mapProteinToTdiAlignment(proteinAlignment,

1466

tdiAlignment, mappedDna, mappedProtein);

1467

return mappingPerformed;

}

/**

* Make mappings between compatible sequences (ids are identical, length of seqs are identical).

1475

1476

* @param proteinAlignment

1477

* @param tdiAlignment

1478

* @param mappedTdiSeq

1479

* a set of mapped DNA sequences (to add to)

1480

* @param mappedProtein

1481

* a set of mapped Protein sequences (to add to)

1482

* @param xrefsOnly

1483

* if true, only map sequences where xrefs exist

1484

* @return

1485

1486

protected static boolean mapProteinToTdiAlignment(

1487

final AlignmentI proteinAlignment, final AlignmentI tdiAlignment,

1488

Set<SequenceI> mappedTdiSeq, Set<SequenceI> mappedProtein)

1489

{

1490

boolean mappingExistsOrAdded = false;

1491

List<SequenceI> thisSeqs = proteinAlignment.getSequences();

1492

for (SequenceI aaSeq : thisSeqs)

1493

{

1494

aaSeq = aaSeq.getDatasetSequence()!=null ? aaSeq.getDatasetSequence():null;

1495

boolean proteinMapped = false;

1496

AlignedCodonFrame acf = new AlignedCodonFrame();

1497

1498

for (SequenceI cdnaSeq : tdiAlignment.getSequences())

1499

{

1500

// resolve dataset sequences

1501

cdnaSeq = cdnaSeq.getDatasetSequence()!=null ? cdnaSeq.getDatasetSequence():null;

1502

1503

if (mappingExists(proteinAlignment.getCodonFrames(),

1504

aaSeq, cdnaSeq))

1505

{

1506

mappingExistsOrAdded = true;

}

else

{

if (canBuild3diMapping(aaSeq, cdnaSeq))

1512

{

1513

MapList map = new MapList(new int[] { aaSeq.getStart(),aaSeq.getEnd()},new int[] { cdnaSeq.getStart(),cdnaSeq.getEnd()},1,1);

1514

acf.addMap(cdnaSeq, aaSeq, map);

1515

mappingExistsOrAdded = true;

1516

proteinMapped = true;

1517

mappedTdiSeq.add(cdnaSeq);

1518

mappedProtein.add(aaSeq);

}

}

}

if (proteinMapped)

{

proteinAlignment.addCodonFrame(acf);

1525

}

1526

}

1527

return mappingExistsOrAdded;

}

/**

* Returns true if the dna sequence is mapped, or could be mapped, to the

* protein sequence.

* @param dnaSeq

* @param proteinSeq

* @param mappings

* @return

protected static boolean isMappable(SequenceI dnaSeq,

1541

SequenceI proteinSeq, List<AlignedCodonFrame> mappings)

1542

{

1543

if (dnaSeq == null || proteinSeq == null)

{

return false;

}

SequenceI dnaDs = dnaSeq.getDatasetSequence() == null ? dnaSeq

1549

: dnaSeq.getDatasetSequence();

1550

SequenceI proteinDs = proteinSeq.getDatasetSequence() == null

1551

? proteinSeq

1552

: proteinSeq.getDatasetSequence();

1553

1554

for (AlignedCodonFrame mapping : mappings)

1555

{

1556

if (proteinDs == mapping.getAaForDnaSeq(dnaDs))

{

* already mapped

return true;

}

}

* Just try to make a mapping (it is not yet stored), test whether

1567

* successful.

1568

1569

return mapCdnaToProtein(proteinDs, dnaDs) != null;

}

/**

* Finds any reference annotations associated with the sequences in

1574

* sequenceScope, that are not already added to the alignment, and adds them

1575

* to the 'candidates' map. Also populates a lookup table of annotation

1576

* labels, keyed by calcId, for use in constructing tooltips or the like.

1577

1578

* @param sequenceScope

1579

* the sequences to scan for reference annotations

1580

* @param labelForCalcId

1581

* (optional) map to populate with label for calcId

1582

* @param candidates

1583

* map to populate with annotations for sequence

1584

* @param al

1585

* the alignment to check for presence of annotations

1586

1587

public static void findAddableReferenceAnnotations(

1588

List<SequenceI> sequenceScope, Map<String, String> labelForCalcId,

1589

final Map<SequenceI, List<AlignmentAnnotation>> candidates,

1590

AlignmentI al)

1591

{

1592

if (sequenceScope == null)

{

return;

}

* For each sequence in scope, make a list of any annotations on the

1599

* underlying dataset sequence which are not already on the alignment.

1600

1601

* Add to a map of { alignmentSequence, <List of annotations to add> }

1602

1603

for (SequenceI seq : sequenceScope)

1604

{

1605

SequenceI dataset = seq.getDatasetSequence();

if (dataset == null)

{

continue;

}

AlignmentAnnotation[] datasetAnnotations = dataset.getAnnotation();

1611

if (datasetAnnotations == null)

{

continue;

}

final List<AlignmentAnnotation> result = new ArrayList<>();

1616

for (AlignmentAnnotation dsann : datasetAnnotations)

1617

{

1618

156

if (dsann.annotations == null) {

1619

continue;// ignore non-positional annotation

1620

}

1621

1622

* Find matching annotations on the alignment. If none is found, then

1623

* add this annotation to the list of 'addable' annotations for this

1624

* sequence.

1625

1626

156

final Iterable<AlignmentAnnotation> matchedAlignmentAnnotations = al

1627

.findAnnotations(seq, dsann.getCalcId(), dsann.label);

1628

156

boolean found = false;

1629

156

if (matchedAlignmentAnnotations != null)

1630

{

1631

153

for (AlignmentAnnotation matched : matchedAlignmentAnnotations)

1632

{

1633

127

if (dsann.description.equals(matched.description))

{

found = true;

break;

}

}

}

156

if (!found) {

1641

107

result.add(dsann);

1642

107

if (labelForCalcId != null)

1643

{

1644

labelForCalcId.put(dsann.getCalcId(), dsann.label);

}

}

}

* Save any addable annotations for this sequence

1650

1651

if (!result.isEmpty())

1652

{

1653

candidates.put(seq, result);

}

}

}

/**

* Adds annotations to the top of the alignment annotations, in the same order

1660

* as their related sequences. If you already have an annotation and want to

1661

* add it to a sequence in an alignment use {@code addReferenceAnnotationTo}

1662

1663

* @param annotations

1664

* the annotations to add

1665

* @param alignment

1666

* the alignment to add them to

1667

* @param selectionGroup

1668

* current selection group - may be null, if provided then any added

1669

* annotation will be trimmed to just those columns in the selection

1670

* group

1671

1672

public static void addReferenceAnnotations(

1673

Map<SequenceI, List<AlignmentAnnotation>> annotations,

1674

final AlignmentI alignment, final SequenceGroup selectionGroup)

1675

{

1676

for (SequenceI seq : annotations.keySet())

1677

{

1678

for (AlignmentAnnotation ann : annotations.get(seq))

1679

{

1680

101

addReferenceAnnotationTo(alignment, seq, ann, selectionGroup);

}

}

}

public static boolean isSSAnnotationPresent(

1686

Map<SequenceI, List<AlignmentAnnotation>> annotations)

1687

{

1688

1689

for (SequenceI seq : annotations.keySet())

1690

{

1691

if (isSecondaryStructurePresent(

1692

annotations.get(seq).toArray(new AlignmentAnnotation[0])))

{

return true;

}

}

return false;

}

/**

* Make a copy of a reference annotation {@code ann} and add it to an

1702

* alignment sequence {@code seq} in {@code alignment}, optionally limited to

1703

* the extent of {@code selectionGroup}

* @param alignment

* @param seq

* @param ann

* @param selectionGroup

1709

* current selection group - may be null, if provided then any added

1710

* annotation will be trimmed to just those columns in the selection

1711

* group

1712

* @return annotation added to {@code seq and {@code alignment}

1713

1714

105

public static AlignmentAnnotation addReferenceAnnotationTo(

1715

final AlignmentI alignment, final SequenceI seq,

1716

final AlignmentAnnotation ann, final SequenceGroup selectionGroup)

1717

{

1718

105

AlignmentAnnotation copyAnn = new AlignmentAnnotation(ann);

1719

105

int startRes = 0;

1720

105

int endRes = ann.annotations.length;

1721

105

if (selectionGroup != null)

1722

{

1723

startRes = -1 + Math.min(seq.getEnd(), Math.max(seq.getStart(),

1724

seq.findPosition(selectionGroup.getStartRes())));

1725

endRes = -1 + Math.min(seq.getEnd(),

1726

seq.findPosition(selectionGroup.getEndRes()));

1727

1728

}

1729

105

copyAnn.restrict(startRes, endRes + 0);

1730

1731

1732

* Add to the sequence (sets copyAnn.datasetSequence), unless the

1733

* original annotation is already on the sequence.

1734

1735

105

if (!seq.hasAnnotation(ann))

1736

{

1737

105

ContactMatrixI cm = seq.getDatasetSequence().getContactMatrixFor(ann);

1738

105

if (cm != null)

1739

{

1740

seq.addContactListFor(copyAnn, cm);

1741

}

1742

105

seq.addAlignmentAnnotation(copyAnn);

1743

}

1744

// adjust for gaps

1745

105

copyAnn.adjustForAlignment();

1746

// add to the alignment and set visible

1747

105

alignment.addAnnotation(copyAnn);

1748

105

copyAnn.visible = true;

1749

1750

105

return copyAnn;

}

/**

* Set visibility of alignment annotations of specified types (labels), for

1755

* specified sequences. This supports controls like "Show all secondary

1756

* structure", "Hide all Temp factor", etc.

1757

1758

* @al the alignment to scan for annotations

1759

* @param types

1760

* the types (labels) of annotations to be updated

1761

* @param forSequences

1762

* if not null, only annotations linked to one of these sequences are

1763

* in scope for update; if null, acts on all sequence annotations

1764

* @param anyType

1765

* if this flag is true, 'types' is ignored (label not checked)

1766

* @param doShow

1767

* if true, set visibility on, else set off

1768

1769

public static void showOrHideSequenceAnnotations(AlignmentI al,

1770

Collection<String> types, List<SequenceI> forSequences,

1771

boolean anyType, boolean doShow)

1772

{

1773

AlignmentAnnotation[] anns = al.getAlignmentAnnotation();

1774

if (anns != null)

1775

{

1776

for (AlignmentAnnotation aa : anns)

1777

{

1778

if (anyType || types.contains(aa.label))

1779

{

1780

if ((aa.sequenceRef != null) && (forSequences == null

1781

|| forSequences.contains(aa.sequenceRef)))

{

aa.visible = doShow;

}

}

}

}

}

/**

* Shows or hides auto calculated annotations for a sequence group.

1792

1793

* @param al

1794

* The alignment object with the annotations.

1795

* @param type

1796

* The type of annotation to show or hide.

1797

* @param selectedGroup

1798

* The sequence group for which the annotations should be shown or

1799

* hidden.

1800

* @param anyType

1801

* If true, all types of annotations will be shown/hidden.

1802

* @param doShow

1803

* If true, the annotations will be shown; if false, annotations will

1804

* be hidden.

1805

1806

public static void showOrHideAutoCalculatedAnnotationsForGroup(

1807

AlignmentI al, String type, SequenceGroup selectedGroup,

1808

boolean anyType, boolean doShow)

1809

{

1810

// Get all alignment annotations

1811

AlignmentAnnotation[] anns = al.getAlignmentAnnotation();

if (anns != null)

{

for (AlignmentAnnotation aa : anns)

1816

{

1817

// Check if anyType is true or if the annotation's label contains the

1818

// specified type (currently for secondary structure consensus)

1819

if ((anyType && aa.label

1820

.startsWith(Constants.SECONDARY_STRUCTURE_CONSENSUS_LABEL))

1821

|| aa.label.startsWith(type))

1822

{

1823

// If the annotation's group reference is not null and matches the

1824

// selected group, update its visibility.

1825

if (aa.groupRef != null && selectedGroup == aa.groupRef)

{

aa.visible = doShow;

}

}

}

}

}

public static AlignmentAnnotation getFirstSequenceAnnotationOfType(

1835

AlignmentI al, int graphType)

1836

{

1837

AlignmentAnnotation[] anns = al.getAlignmentAnnotation();

1838

if (anns != null)

1839

{

1840

for (AlignmentAnnotation aa : anns)

1841

{

1842

if (aa.sequenceRef != null && aa.graph == graphType)

return aa;

}

}

return null;

}

/**

* Returns true if either sequence has a cross-reference to the other

* @param seq1

* @param seq2

* @return

public static boolean haveCrossRef(SequenceI seq1, SequenceI seq2)

1857

{

1858

// Note: moved here from class CrossRef as the latter class has dependencies

1859

// not availability to the applet's classpath

1860

return hasCrossRef(seq1, seq2) || hasCrossRef(seq2, seq1);

}

/**

* Returns true if seq1 has a cross-reference to seq2. Currently this assumes

1865

* that sequence name is structured as Source|AccessionId.

* @param seq1

* @param seq2

* @return

108

public static boolean hasCrossRef(SequenceI seq1, SequenceI seq2)

1872

{

1873

108

if (seq1 == null || seq2 == null)

{

return false;

}

100

String name = seq2.getName();

1878

100

final List<DBRefEntry> xrefs = seq1.getDBRefs();

1879

100

if (xrefs != null)

1880

{

1881

for (int ix = 0, nx = xrefs.size(); ix < nx; ix++)

1882

{

1883

DBRefEntry xref = xrefs.get(ix);

1884

String xrefName = xref.getSource() + "|" + xref.getAccessionId();

1885

// case-insensitive test, consistent with DBRefEntry.equalRef()

1886

if (xrefName.equalsIgnoreCase(name))

{

return true;

}

}

}

return false;

}

/**

* Constructs an alignment consisting of the mapped (CDS) regions in the given

1897

* nucleotide sequences, and updates mappings to match. The CDS sequences are

1898

* added to the original alignment's dataset, which is shared by the new

1899

* alignment. Mappings from nucleotide to CDS, and from CDS to protein, are

1900

* added to the alignment dataset.

1901

1902

* @param dna

1903

* aligned nucleotide (dna or cds) sequences

1904

* @param dataset

1905

* the alignment dataset the sequences belong to

1906

* @param products

1907

* (optional) to restrict results to CDS that map to specified

1908

* protein products

1909

* @return an alignment whose sequences are the cds-only parts of the dna

1910

* sequences (or null if no mappings are found)

1911

1912

public static AlignmentI makeCdsAlignment(SequenceI[] dna,

1913

AlignmentI dataset, SequenceI[] products)

1914

{

1915

if (dataset == null || dataset.getDataset() != null)

1916

{

1917

throw new IllegalArgumentException(

1918

"IMPLEMENTATION ERROR: dataset.getDataset() must be null!");

1919

}

1920

List<SequenceI> foundSeqs = new ArrayList<>();

1921

List<SequenceI> cdsSeqs = new ArrayList<>();

1922

List<AlignedCodonFrame> mappings = dataset.getCodonFrames();

1923

HashSet<SequenceI> productSeqs = null;

1924

if (products != null)

1925

{

1926

productSeqs = new HashSet<>();

1927

for (SequenceI seq : products)

1928

{

1929

productSeqs.add(seq.getDatasetSequence() == null ? seq

1930

: seq.getDatasetSequence());

}

}

* Construct CDS sequences from mappings on the alignment dataset.

1936

* The logic is:

1937

* - find the protein product(s) mapped to from each dna sequence

1938

* - if the mapping covers the whole dna sequence (give or take start/stop

1939

* codon), take the dna as the CDS sequence

1940

* - else search dataset mappings for a suitable dna sequence, i.e. one

1941

* whose whole sequence is mapped to the protein

1942

* - if no sequence found, construct one from the dna sequence and mapping

1943

* (and add it to dataset so it is found if this is repeated)

1944

1945

for (SequenceI dnaSeq : dna)

1946

{

1947

SequenceI dnaDss = dnaSeq.getDatasetSequence() == null ? dnaSeq

1948

: dnaSeq.getDatasetSequence();

1949

1950

List<AlignedCodonFrame> seqMappings = MappingUtils

1951

.findMappingsForSequence(dnaSeq, mappings);

1952

for (AlignedCodonFrame mapping : seqMappings)

1953

{

1954

List<Mapping> mappingsFromSequence = mapping

1955

.getMappingsFromSequence(dnaSeq);

1956

1957

for (Mapping aMapping : mappingsFromSequence)

1958

{

1959

MapList mapList = aMapping.getMap();

1960

if (mapList.getFromRatio() == 1)

1961

{

1962

1963

* not a dna-to-protein mapping (likely dna-to-cds)

continue;

}

* skip if mapping is not to one of the target set of proteins

1970

1971

SequenceI proteinProduct = aMapping.getTo();

1972

if (productSeqs != null && !productSeqs.contains(proteinProduct))

{

continue;

}

* try to locate the CDS from the dataset mappings;

1979

* guard against duplicate results (for the case that protein has

1980

* dbrefs to both dna and cds sequences)

1981

1982

SequenceI cdsSeq = findCdsForProtein(mappings, dnaSeq,

1983

seqMappings, aMapping);

1984

if (cdsSeq != null)

1985

{

1986

if (!foundSeqs.contains(cdsSeq))

1987

{

1988

foundSeqs.add(cdsSeq);

1989

SequenceI derivedSequence = cdsSeq.deriveSequence();

1990

cdsSeqs.add(derivedSequence);

1991

if (!dataset.getSequences().contains(cdsSeq))

1992

{

1993

dataset.addSequence(cdsSeq);

}

}

continue;

}

* didn't find mapped CDS sequence - construct it and add

2001

* its dataset sequence to the dataset

2002

2003

cdsSeq = makeCdsSequence(dnaSeq.getDatasetSequence(), aMapping,

2004

dataset).deriveSequence();

2005

// cdsSeq has a name constructed as CDS|<dbref>

2006

// <dbref> will be either the accession for the coding sequence,

2007

// marked in the /via/ dbref to the protein product accession

2008

// or it will be the original nucleotide accession.

2009

SequenceI cdsSeqDss = cdsSeq.getDatasetSequence();

cdsSeqs.add(cdsSeq);

* build the mapping from CDS to protein

2015

2016

List<int[]> cdsRange = Collections

2017

.singletonList(new int[]

2018

{ cdsSeq.getStart(),

2019

cdsSeq.getLength() + cdsSeq.getStart() - 1 });

2020

MapList cdsToProteinMap = new MapList(cdsRange,

2021

mapList.getToRanges(), mapList.getFromRatio(),

2022

mapList.getToRatio());

2023

2024

if (!dataset.getSequences().contains(cdsSeqDss))

2025

{

2026

2027

* if this sequence is a newly created one, add it to the dataset

2028

* and made a CDS to protein mapping (if sequence already exists,

2029

* CDS-to-protein mapping _is_ the transcript-to-protein mapping)

2030

2031

dataset.addSequence(cdsSeqDss);

2032

AlignedCodonFrame cdsToProteinMapping = new AlignedCodonFrame();

2033

cdsToProteinMapping.addMap(cdsSeqDss, proteinProduct,

cdsToProteinMap);

* guard against duplicating the mapping if repeating this action

2038

2039

if (!mappings.contains(cdsToProteinMapping))

2040

{

2041

mappings.add(cdsToProteinMapping);

}

}

propagateDBRefsToCDS(cdsSeqDss, dnaSeq.getDatasetSequence(),

2046

proteinProduct, aMapping);

2047

2048

* add another mapping from original 'from' range to CDS

2049

2050

AlignedCodonFrame dnaToCdsMapping = new AlignedCodonFrame();

2051

final MapList dnaToCdsMap = new MapList(mapList.getFromRanges(),

2052

cdsRange, 1, 1);

2053

dnaToCdsMapping.addMap(dnaSeq.getDatasetSequence(), cdsSeqDss,

2054

dnaToCdsMap);

2055

if (!mappings.contains(dnaToCdsMapping))

2056

{

2057

mappings.add(dnaToCdsMapping);

}

* transfer dna chromosomal loci (if known) to the CDS

2062

* sequence (via the mapping)

2063

2064

final MapList cdsToDnaMap = dnaToCdsMap.getInverse();

2065

transferGeneLoci(dnaSeq, cdsToDnaMap, cdsSeq);

2066

2067

2068

* add DBRef with mapping from protein to CDS

2069

* (this enables Get Cross-References from protein alignment)

2070

* This is tricky because we can't have two DBRefs with the

2071

* same source and accession, so need a different accession for

2072

* the CDS from the dna sequence

2073

2074

2075

// specific use case:

2076

// Genomic contig ENSCHR:1, contains coding regions for ENSG01,

2077

// ENSG02, ENSG03, with transcripts and products similarly named.

2078

// cannot add distinct dbrefs mapping location on ENSCHR:1 to ENSG01

2079

2080

// JBPNote: ?? can't actually create an example that demonstrates we

2081

// need to

2082

// synthesize an xref.

2083

2084

List<DBRefEntry> primrefs = dnaDss.getPrimaryDBRefs();

2085

for (int ip = 0, np = primrefs.size(); ip < np; ip++)

2086

{

2087

DBRefEntry primRef = primrefs.get(ip);

2088

2089

* create a cross-reference from CDS to the source sequence's

2090

* primary reference and vice versa

2091

2092

String source = primRef.getSource();

2093

String version = primRef.getVersion();

2094

DBRefEntry cdsCrossRef = new DBRefEntry(source,

2095

source + ":" + version, primRef.getAccessionId());

2096

cdsCrossRef

2097

.setMap(new Mapping(dnaDss, new MapList(cdsToDnaMap)));

2098

cdsSeqDss.addDBRef(cdsCrossRef);

2099

2100

dnaSeq.addDBRef(new DBRefEntry(source, version,

2101

cdsSeq.getName(), new Mapping(cdsSeqDss, dnaToCdsMap)));

2102

// problem here is that the cross-reference is synthesized -

2103

// cdsSeq.getName() may be like 'CDS|dnaaccession' or

2104

// 'CDS|emblcdsacc'

2105

// assuming cds version same as dna ?!?

2106

2107

DBRefEntry proteinToCdsRef = new DBRefEntry(source, version,

2108

cdsSeq.getName());

2109

2110

proteinToCdsRef.setMap(

2111

new Mapping(cdsSeqDss, cdsToProteinMap.getInverse()));

2112

proteinProduct.addDBRef(proteinToCdsRef);

2113

}

2114

2115

* transfer any features on dna that overlap the CDS

2116

2117

transferFeatures(dnaSeq, cdsSeq, dnaToCdsMap, null,

2118

SequenceOntologyI.CDS);

}

}

}

AlignmentI cds = new Alignment(

2124

cdsSeqs.toArray(new SequenceI[cdsSeqs.size()]));

2125

cds.setDataset(dataset);

return cds;

}

/**

* Tries to transfer gene loci (dbref to chromosome positions) from fromSeq to

2132

* toSeq, mediated by the given mapping between the sequences

2133

2134

* @param fromSeq

2135

* @param targetToFrom

* Map

* @param targetSeq

protected static void transferGeneLoci(SequenceI fromSeq,

2140

MapList targetToFrom, SequenceI targetSeq)

2141

{

2142

if (targetSeq.getGeneLoci() != null)

2143

{

2144

// already have - don't override

2145

return;

2146

}

2147

GeneLociI fromLoci = fromSeq.getGeneLoci();

2148

if (fromLoci == null)

{

return;

}

MapList newMap = targetToFrom.traverse(fromLoci.getMapping());

if (newMap != null)

{

targetSeq.setGeneLoci(fromLoci.getSpeciesId(),

2158

fromLoci.getAssemblyId(), fromLoci.getChromosomeId(), newMap);

}

}

/**

* A helper method that finds a CDS sequence in the alignment dataset that is

2164

* mapped to the given protein sequence, and either is, or has a mapping from,

2165

* the given dna sequence.

2166

2167

* @param mappings

2168

* set of all mappings on the dataset

2169

* @param dnaSeq

2170

* a dna (or cds) sequence we are searching from

2171

* @param seqMappings

2172

* the set of mappings involving dnaSeq

2173

* @param aMapping

2174

* a transcript-to-peptide mapping

2175

* @return

2176

2177

static SequenceI findCdsForProtein(List<AlignedCodonFrame> mappings,

2178

SequenceI dnaSeq, List<AlignedCodonFrame> seqMappings,

Mapping aMapping)

{

* TODO a better dna-cds-protein mapping data representation to allow easy

2183

* navigation; until then this clunky looping around lists of mappings

2184

2185

SequenceI seqDss = dnaSeq.getDatasetSequence() == null ? dnaSeq

2186

: dnaSeq.getDatasetSequence();

2187

SequenceI proteinProduct = aMapping.getTo();

2188

2189

2190

* is this mapping from the whole dna sequence (i.e. CDS)?

2191

* allowing for possible stop codon on dna but not peptide

2192

2193

int mappedFromLength = MappingUtils

2194

.getLength(aMapping.getMap().getFromRanges());

2195

int dnaLength = seqDss.getLength();

2196

if (mappedFromLength == dnaLength

2197

|| mappedFromLength == dnaLength - CODON_LENGTH)

2198

{

2199

2200

* if sequence has CDS features, this is a transcript with no UTR

2201

* - do not take this as the CDS sequence! (JAL-2789)

2202

2203

if (seqDss.getFeatures().getFeaturesByOntology(SequenceOntologyI.CDS)

.isEmpty())

{

return seqDss;

}

}

* looks like we found the dna-to-protein mapping; search for the

2212

* corresponding cds-to-protein mapping

2213

2214

List<AlignedCodonFrame> mappingsToPeptide = MappingUtils

2215

.findMappingsForSequence(proteinProduct, mappings);

2216

for (AlignedCodonFrame acf : mappingsToPeptide)

2217

{

2218

for (SequenceToSequenceMapping map : acf.getMappings())

2219

{

2220

276

Mapping mapping = map.getMapping();

2221

276

if (mapping != aMapping

2222

&& mapping.getMap().getFromRatio() == CODON_LENGTH

2223

&& proteinProduct == mapping.getTo()

2224

&& seqDss != map.getFromSeq())

2225

{

2226

mappedFromLength = MappingUtils

2227

.getLength(mapping.getMap().getFromRanges());

2228

if (mappedFromLength == map.getFromSeq().getLength())

2229

{

2230

2231

* found a 3:1 mapping to the protein product which covers

2232

* the whole dna sequence i.e. is from CDS; finally check the CDS

2233

* is mapped from the given dna start sequence

2234

2235

SequenceI cdsSeq = map.getFromSeq();

2236

// todo this test is weak if seqMappings contains multiple mappings;

2237

// we get away with it if transcript:cds relationship is 1:1

2238

List<AlignedCodonFrame> dnaToCdsMaps = MappingUtils

2239

.findMappingsForSequence(cdsSeq, seqMappings);

2240

if (!dnaToCdsMaps.isEmpty())

{

return cdsSeq;

}

}

}

}

}

return null;

}

/**

* Helper method that makes a CDS sequence as defined by the mappings from the

2253

* given sequence i.e. extracts the 'mapped from' ranges (which may be on

2254

* forward or reverse strand).

* @param seq

* @param mapping

* @param dataset

* - existing dataset. We check for sequences that look like the CDS

2260

* we are about to construct, if one exists already, then we will

2261

* just return that one.

2262

* @return CDS sequence (as a dataset sequence)

2263

2264

static SequenceI makeCdsSequence(SequenceI seq, Mapping mapping,

AlignmentI dataset)

{

* construct CDS sequence name as "CDS|" with 'from id' held in the mapping

2269

* if set (e.g. EMBL protein_id), else sequence name appended

2270

2271

String mapFromId = mapping.getMappedFromId();

2272

final String seqId = "CDS|"

2273

+ (mapFromId != null ? mapFromId : seq.getName());

2274

2275

SequenceI newSeq = null;

2276

2277

2278

* construct CDS sequence by splicing mapped from ranges

2279

2280

char[] seqChars = seq.getSequence();

2281

List<int[]> fromRanges = mapping.getMap().getFromRanges();

2282

int cdsWidth = MappingUtils.getLength(fromRanges);

2283

char[] newSeqChars = new char[cdsWidth];

2284

2285

int newPos = 0;

2286

for (int[] range : fromRanges)

2287

{

2288

if (range[0] <= range[1])

2289

{

2290

// forward strand mapping - just copy the range

2291

int length = range[1] - range[0] + 1;

2292

System.arraycopy(seqChars, range[0] - 1, newSeqChars, newPos,

length);

newPos += length;

}

else

{

// reverse strand mapping - copy and complement one by one

2299

for (int i = range[0]; i >= range[1]; i--)

2300

{

2301

newSeqChars[newPos++] = Dna.getComplement(seqChars[i - 1]);

}

}

newSeq = new Sequence(seqId, newSeqChars, 1, newPos);

}

if (dataset != null)

{

SequenceI[] matches = dataset.findSequenceMatch(newSeq.getName());

2311

if (matches != null)

2312

{

2313

boolean matched = false;

2314

for (SequenceI mtch : matches)

2315

{

2316

if (mtch.getStart() != newSeq.getStart())

{

continue;

}

if (mtch.getEnd() != newSeq.getEnd())

{

continue;

}

if (!Arrays.equals(mtch.getSequence(), newSeq.getSequence()))

{

continue;

}

if (!matched)

{

matched = true;

newSeq = mtch;

}

else

{

Console.error(

"JAL-2154 regression: warning - found (and ignored) a duplicate CDS sequence:"

+ mtch.toString());

}

}

}

}

// newSeq.setDescription(mapFromId);

return newSeq;

}

/**

* Adds any DBRefEntrys to cdsSeq from contig that have a Mapping congruent to

* the given mapping.

* @param cdsSeq

* @param contig

* @param proteinProduct

2354

* @param mapping

2355

* @return list of DBRefEntrys added

2356

2357

protected static List<DBRefEntry> propagateDBRefsToCDS(SequenceI cdsSeq,

2358

SequenceI contig, SequenceI proteinProduct, Mapping mapping)

2359

{

2360

2361

// gather direct refs from contig congruent with mapping

2362

List<DBRefEntry> direct = new ArrayList<>();

2363

HashSet<String> directSources = new HashSet<>();

2364

2365

List<DBRefEntry> refs = contig.getDBRefs();

2366

if (refs != null)

2367

{

2368

292

for (int ib = 0, nb = refs.size(); ib < nb; ib++)

2369

{

2370

279

DBRefEntry dbr = refs.get(ib);

2371

279

MapList map;

2372

if (dbr.hasMap() && (map = dbr.getMap().getMap()).isTripletMap())

2373

{

2374

// check if map is the CDS mapping

2375

if (mapping.getMap().equals(map))

2376

{

2377

direct.add(dbr);

2378

directSources.add(dbr.getSource());

}

}

}

}

List<DBRefEntry> onSource = DBRefUtils.selectRefs(

2384

proteinProduct.getDBRefs(),

2385

directSources.toArray(new String[0]));

2386

List<DBRefEntry> propagated = new ArrayList<>();

2387

2388

// and generate appropriate mappings

2389

for (int ic = 0, nc = direct.size(); ic < nc; ic++)

2390

{

2391

DBRefEntry cdsref = direct.get(ic);

2392

Mapping m = cdsref.getMap();

2393

// clone maplist and mapping

2394

MapList cdsposmap = new MapList(

2395

Arrays.asList(new int[][]

2396

{ new int[] { cdsSeq.getStart(), cdsSeq.getEnd() } }),

2397

m.getMap().getToRanges(), 3, 1);

2398

Mapping cdsmap = new Mapping(m.getTo(), m.getMap());

2399

2400

// create dbref

2401

DBRefEntry newref = new DBRefEntry(cdsref.getSource(),

2402

cdsref.getVersion(), cdsref.getAccessionId(),

2403

new Mapping(cdsmap.getTo(), cdsposmap));

2404

2405

// and see if we can map to the protein product for this mapping.

2406

// onSource is the filtered set of accessions on protein that we are

2407

// tranferring, so we assume accession is the same.

2408

if (cdsmap.getTo() == null && onSource != null)

2409

{

2410

List<DBRefEntry> sourceRefs = DBRefUtils.searchRefs(onSource,

2411

cdsref.getAccessionId());

2412

if (sourceRefs != null)

2413

{

2414

for (DBRefEntry srcref : sourceRefs)

2415

{

2416

if (srcref.getSource().equalsIgnoreCase(cdsref.getSource()))

2417

{

2418

// we have found a complementary dbref on the protein product, so

2419

// update mapping's getTo

2420

newref.getMap().setTo(proteinProduct);

}

}

}

}

cdsSeq.addDBRef(newref);

2426

propagated.add(newref);

}

return propagated;

}

/**

* Transfers co-located features on 'fromSeq' to 'toSeq', adjusting the

2433

* feature start/end ranges, optionally omitting specified feature types.

2434

* Returns the number of features copied.

* @param fromSeq

* @param toSeq

* @param mapping

* the mapping from 'fromSeq' to 'toSeq'

2440

* @param select

2441

* if not null, only features of this type are copied (including

2442

* subtypes in the Sequence Ontology)

2443

* @param omitting

2444

2445

protected static int transferFeatures(SequenceI fromSeq, SequenceI toSeq,

2446

MapList mapping, String select, String... omitting)

2447

{

2448

SequenceI copyTo = toSeq;

2449

while (copyTo.getDatasetSequence() != null)

2450

{

2451

copyTo = copyTo.getDatasetSequence();

2452

}

2453

if (fromSeq == copyTo || fromSeq.getDatasetSequence() == copyTo)

2454

{

2455

return 0; // shared dataset sequence

}

* get features, optionally restricted by an ontology term

2460

2461

List<SequenceFeature> sfs = select == null

2462

? fromSeq.getFeatures().getPositionalFeatures()

2463

: fromSeq.getFeatures().getFeaturesByOntology(select);

2464

2465

int count = 0;

2466

for (SequenceFeature sf : sfs)

2467

{

2468

9610

String type = sf.getType();

2469

9610

boolean omit = false;

2470

9610

for (String toOmit : omitting)

2471

{

2472

9603

if (type.equals(toOmit))

2473

{

2474

134

omit = true;

2475

}

2476

}

2477

9610

if (omit)

2478

{

2479

134

continue;

}

* locate the mapped range - null if either start or end is

2484

* not mapped (no partial overlaps are calculated)

2485

2486

9476

int start = sf.getBegin();

2487

9476

int end = sf.getEnd();

2488

9476

int[] mappedTo = mapping.locateInTo(start, end);

2489

2490

* if whole exon range doesn't map, try interpreting it

2491

* as 5' or 3' exon overlapping the CDS range

2492

2493

9476

if (mappedTo == null)

2494

{

2495

4447

mappedTo = mapping.locateInTo(end, end);

2496

4447

if (mappedTo != null)

2497

{

2498

2499

* end of exon is in CDS range - 5' overlap

2500

* to a range from the start of the peptide

mappedTo[0] = 1;

}

}

9476

if (mappedTo == null)

2506

{

2507

4447

mappedTo = mapping.locateInTo(start, start);

2508

4447

if (mappedTo != null)

2509

{

2510

2511

* start of exon is in CDS range - 3' overlap

2512

* to a range up to the end of the peptide

2513

2514

mappedTo[1] = toSeq.getLength();

2515

}

2516

}

2517

9476

if (mappedTo != null)

2518

{

2519

5029

int newBegin = Math.min(mappedTo[0], mappedTo[1]);

2520

5029

int newEnd = Math.max(mappedTo[0], mappedTo[1]);

2521

5029

SequenceFeature copy = new SequenceFeature(sf, newBegin, newEnd,

2522

sf.getFeatureGroup(), sf.getScore());

2523

5029

copyTo.addSequenceFeature(copy);

2524

5029

count++;

}

}

return count;

}

/**

* Returns a mapping from dna to protein by inspecting sequence features of

2532

* type "CDS" on the dna. A mapping is constructed if the total CDS feature

2533

* length is 3 times the peptide length (optionally after dropping a trailing

2534

* stop codon). This method does not check whether the CDS nucleotide sequence

2535

* translates to the peptide sequence.

* @param dnaSeq

* @param proteinSeq

* @return

public static MapList mapCdsToProtein(SequenceI dnaSeq,

2542

SequenceI proteinSeq)

2543

{

2544

List<int[]> ranges = findCdsPositions(dnaSeq);

2545

int mappedDnaLength = MappingUtils.getLength(ranges);

2546

2547

2548

* if not a whole number of codons, truncate mapping

2549

2550

int codonRemainder = mappedDnaLength % CODON_LENGTH;

2551

if (codonRemainder > 0)

2552

{

2553

mappedDnaLength -= codonRemainder;

2554

MappingUtils.removeEndPositions(codonRemainder, ranges);

2555

}

2556

2557

int proteinLength = proteinSeq.getLength();

2558

int proteinStart = proteinSeq.getStart();

2559

int proteinEnd = proteinSeq.getEnd();

2560

2561

2562

* incomplete start codon may mean X at start of peptide

2563

* we ignore both for mapping purposes

2564

2565

if (proteinSeq.getCharAt(0) == 'X')

2566

{

2567

// todo JAL-2022 support startPhase > 0

proteinStart++;

proteinLength--;

}

List<int[]> proteinRange = new ArrayList<>();

2572

2573

2574

* dna length should map to protein (or protein plus stop codon)

2575

2576

int codesForResidues = mappedDnaLength / CODON_LENGTH;

2577

if (codesForResidues == (proteinLength + 1))

2578

{

2579

// assuming extra codon is for STOP and not in peptide

2580

// todo: check trailing codon is indeed a STOP codon

2581

codesForResidues--;

2582

mappedDnaLength -= CODON_LENGTH;

2583

MappingUtils.removeEndPositions(CODON_LENGTH, ranges);

2584

}

2585

2586

if (codesForResidues == proteinLength)

2587

{

2588

proteinRange.add(new int[] { proteinStart, proteinEnd });

2589

return new MapList(ranges, proteinRange, CODON_LENGTH, 1);

}

return null;

}

/**

* Returns a list of CDS ranges found (as sequence positions base 1), i.e. of

2596

* [start, end] positions of sequence features of type "CDS" (or a sub-type of

2597

* CDS in the Sequence Ontology). The ranges are sorted into ascending start

2598

* position order, so this method is only valid for linear CDS in the same

2599

* sense as the protein product.

* @param dnaSeq

* @return

protected static List<int[]> findCdsPositions(SequenceI dnaSeq)

2605

{

2606

List<int[]> result = new ArrayList<>();

2607

2608

List<SequenceFeature> sfs = dnaSeq.getFeatures()

2609

.getFeaturesByOntology(SequenceOntologyI.CDS);

if (sfs.isEmpty())

{

return result;

}

SequenceFeatures.sortFeatures(sfs, true);

2615

2616

for (SequenceFeature sf : sfs)

{

int phase = 0;

try

{

String s = sf.getPhase();

2622

if (s != null)

2623

{

2624

phase = Integer.parseInt(s);

2625

}

2626

} catch (NumberFormatException e)

{

// leave as zero

}

* phase > 0 on first codon means 5' incomplete - skip to the start

2632

* of the next codon; example ENST00000496384

2633

2634

int begin = sf.getBegin();

2635

int end = sf.getEnd();

2636

if (result.isEmpty() && phase > 0)

{

begin += phase;

if (begin > end)

{

// shouldn't happen!

System.err

.println("Error: start phase extends beyond start CDS in "

+ dnaSeq.getName());

}

}

result.add(new int[] { begin, end });

}

* Finally sort ranges by start position. This avoids a dependency on

2652

* keeping features in order on the sequence (if they are in order anyway,

2653

* the sort will have almost no work to do). The implicit assumption is CDS

2654

* ranges are assembled in order. Other cases should not use this method,

2655

* but instead construct an explicit mapping for CDS (e.g. EMBL parsing).

2656

2657

Collections.sort(result, IntRangeComparator.ASCENDING);

return result;

}

/**

* Makes an alignment with a copy of the given sequences, adding in any

2663

* non-redundant sequences which are mapped to by the cross-referenced

* sequences.

* @param seqs

* @param xrefs

* @param dataset

* the alignment dataset shared by the new copy

2670

* @return

2671

2672

public static AlignmentI makeCopyAlignment(SequenceI[] seqs,

2673

SequenceI[] xrefs, AlignmentI dataset)

2674

{

2675

AlignmentI copy = new Alignment(new Alignment(seqs));

2676

copy.setDataset(dataset);

2677

boolean isProtein = !copy.isNucleotide();

2678

SequenceIdMatcher matcher = new SequenceIdMatcher(seqs);

2679

if (xrefs != null)

2680

{

2681

// BH 2019.01.25 recoded to remove iterators

2682

2683

for (int ix = 0, nx = xrefs.length; ix < nx; ix++)

2684

{

2685

SequenceI xref = xrefs[ix];

2686

List<DBRefEntry> dbrefs = xref.getDBRefs();

2687

if (dbrefs != null)

2688

{

2689

for (int ir = 0, nir = dbrefs.size(); ir < nir; ir++)

2690

{

2691

DBRefEntry dbref = dbrefs.get(ir);

2692

Mapping map = dbref.getMap();

2693

SequenceI mto;

2694

if (map == null || (mto = map.getTo()) == null

2695

|| mto.isProtein() != isProtein)

{

continue;

}

SequenceI mappedTo = mto;

2700

SequenceI match = matcher.findIdMatch(mappedTo);

2701

if (match == null)

2702

{

2703

matcher.add(mappedTo);

2704

copy.addSequence(mappedTo);

}

}

}

}

}

return copy;

}

/**

* Try to align sequences in 'unaligned' to match the alignment of their

2715

* mapped regions in 'aligned'. For example, could use this to align CDS

2716

* sequences which are mapped to their parent cDNA sequences.

2717

2718

* This method handles 1:1 mappings (dna-to-dna or protein-to-protein). For

2719

* dna-to-protein or protein-to-dna use alternative methods.

2720

2721

* @param unaligned

2722

* sequences to be aligned

2723

* @param aligned

2724

* holds aligned sequences and their mappings

2725

* @return

2726

2727

public static int alignAs(AlignmentI unaligned, AlignmentI aligned)

2728

{

2729

2730

* easy case - aligning a copy of aligned sequences

2731

2732

if (alignAsSameSequences(unaligned, aligned))

2733

{

2734

return unaligned.getHeight();

}

* fancy case - aligning via mappings between sequences

2739

2740

List<SequenceI> unmapped = new ArrayList<>();

2741

Map<Integer, Map<SequenceI, Character>> columnMap = buildMappedColumnsMap(

2742

unaligned, aligned, unmapped);

2743

int width = columnMap.size();

2744

char gap = unaligned.getGapCharacter();

2745

int realignedCount = 0;

2746

// TODO: verify this loop scales sensibly for very wide/high alignments

2747

2748

for (SequenceI seq : unaligned.getSequences())

2749

{

2750

if (!unmapped.contains(seq))

2751

{

2752

char[] newSeq = new char[width];

2753

Arrays.fill(newSeq, gap); // JBPComment - doubt this is faster than the

2754

// Integer iteration below

int newCol = 0;

int lastCol = 0;

* traverse the map to find columns populated

2760

* by our sequence

2761

2762

for (Integer column : columnMap.keySet())

2763

{

2764

59000

Character c = columnMap.get(column).get(seq);

2765

59000

if (c != null)

2766

{

2767

2768

* sequence has a character at this position

2769

2770

2771

32002

newSeq[newCol] = c;

2772

32002

lastCol = newCol;

2773

}

2774

59000

newCol++;

}

* trim trailing gaps

if (lastCol < width)

{

char[] tmp = new char[lastCol + 1];

2783

System.arraycopy(newSeq, 0, tmp, 0, lastCol + 1);

2784

newSeq = tmp;

2785

}

2786

// TODO: optimise SequenceI to avoid char[]->String->char[]

2787

seq.setSequence(String.valueOf(newSeq));

realignedCount++;

}

}

return realignedCount;

}

/**

* If unaligned and aligned sequences share the same dataset sequences, then

2796

* simply copies the aligned sequences to the unaligned sequences and returns

2797

* true; else returns false

2798

2799

* @param unaligned

2800

* - sequences to be aligned based on aligned

2801

* @param aligned

2802

* - 'guide' alignment containing sequences derived from same dataset

* as unaligned

* @return

static boolean alignAsSameSequences(AlignmentI unaligned,

2807

AlignmentI aligned)

2808

{

2809

if (aligned.getDataset() == null || unaligned.getDataset() == null)

2810

{

2811

return false; // should only pass alignments with datasets here

2812

}

2813

2814

// map from dataset sequence to alignment sequence(s)

2815

Map<SequenceI, List<SequenceI>> alignedDatasets = new HashMap<>();

2816

for (SequenceI seq : aligned.getSequences())

2817

{

2818

SequenceI ds = seq.getDatasetSequence();

2819

if (alignedDatasets.get(ds) == null)

2820

{

2821

alignedDatasets.put(ds, new ArrayList<SequenceI>());

2822

}

2823

alignedDatasets.get(ds).add(seq);

}

* first pass - check whether all sequences to be aligned share a

2828

* dataset sequence with an aligned sequence; also note the leftmost

2829

* ungapped column from which to copy

2830

2831

int leftmost = Integer.MAX_VALUE;

2832

for (SequenceI seq : unaligned.getSequences())

2833

{

2834

final SequenceI ds = seq.getDatasetSequence();

2835

if (!alignedDatasets.containsKey(ds))

{

return false;

}

SequenceI alignedSeq = alignedDatasets.get(ds).get(0);

2840

int startCol = alignedSeq.findIndex(seq.getStart()); // 1..

2841

leftmost = Math.min(leftmost, startCol);

}

* second pass - copy aligned sequences;

2846

* heuristic rule: pair off sequences in order for the case where

2847

* more than one shares the same dataset sequence

2848

2849

final char gapCharacter = aligned.getGapCharacter();

2850

for (SequenceI seq : unaligned.getSequences())

2851

{

2852

List<SequenceI> alignedSequences = alignedDatasets

2853

.get(seq.getDatasetSequence());

2854

if (alignedSequences.isEmpty())

2855

{

2856

2857

* defensive check - shouldn't happen! (JAL-3536)

continue;

}

SequenceI alignedSeq = alignedSequences.get(0);

2862

2863

2864

* gap fill for leading (5') UTR if any

2865

2866

// TODO this copies intron columns - wrong!

2867

int startCol = alignedSeq.findIndex(seq.getStart()); // 1..

2868

int endCol = alignedSeq.findIndex(seq.getEnd());

2869

char[] seqchars = new char[endCol - leftmost + 1];

2870

Arrays.fill(seqchars, gapCharacter);

2871

char[] toCopy = alignedSeq.getSequence(startCol - 1, endCol);

2872

System.arraycopy(toCopy, 0, seqchars, startCol - leftmost,

2873

toCopy.length);

2874

seq.setSequence(String.valueOf(seqchars));

2875

if (alignedSequences.size() > 0)

2876

{

2877

// pop off aligned sequences (except the last one)

2878

alignedSequences.remove(0);

}

}

* finally remove gapped columns (e.g. introns)

2884

2885

new RemoveGapColCommand("", unaligned.getSequencesArray(), 0,

2886

unaligned.getWidth() - 1, unaligned);

return true;

}

/**

* Returns a map whose key is alignment column number (base 1), and whose

2893

* values are a map of sequence characters in that column.

* @param unaligned

* @param aligned

* @param unmapped

* @return

static SortedMap<Integer, Map<SequenceI, Character>> buildMappedColumnsMap(

2901

AlignmentI unaligned, AlignmentI aligned,

2902

List<SequenceI> unmapped)

2903

{

2904

2905

* Map will hold, for each aligned column position, a map of

2906

* {unalignedSequence, characterPerSequence} at that position.

2907

* TreeMap keeps the entries in ascending column order.

2908

2909

SortedMap<Integer, Map<SequenceI, Character>> map = new TreeMap<>();

2910

2911

2912

* record any sequences that have no mapping so can't be realigned

2913

2914

unmapped.addAll(unaligned.getSequences());

2915

2916

List<AlignedCodonFrame> mappings = aligned.getCodonFrames();

2917

2918

for (SequenceI seq : unaligned.getSequences())

2919

{

2920

for (AlignedCodonFrame mapping : mappings)

2921

{

2922

518

SequenceI fromSeq = mapping.findAlignedSequence(seq, aligned);

2923

518

if (fromSeq != null)

2924

{

2925

Mapping seqMap = mapping.getMappingBetween(fromSeq, seq);

2926

if (addMappedPositions(seq, fromSeq, seqMap, map))

2927

{

2928

unmapped.remove(seq);

}

}

}

}

return map;

}

/**

* Helper method that adds to a map the mapped column positions of a sequence.

2938

* <br>

2939

* For example if aaTT-Tg-gAAA is mapped to TTTAAA then the map should record

2940

* that columns 3,4,6,10,11,12 map to characters T,T,T,A,A,A of the mapped to

* sequence.

* @param seq

* the sequence whose column positions we are recording

2945

* @param fromSeq

2946

* a sequence that is mapped to the first sequence

2947

* @param seqMap

2948

* the mapping from 'fromSeq' to 'seq'

2949

* @param map

2950

* a map to add the column positions (in fromSeq) of the mapped

* positions of seq

* @return

static boolean addMappedPositions(SequenceI seq, SequenceI fromSeq,

2955

Mapping seqMap, Map<Integer, Map<SequenceI, Character>> map)

{

if (seqMap == null)

{

return false;

}

* invert mapping if it is from unaligned to aligned sequence

2964

2965

if (seqMap.getTo() == fromSeq.getDatasetSequence())

2966

{

2967

seqMap = new Mapping(seq.getDatasetSequence(),

2968

seqMap.getMap().getInverse());

2969

}

2970

2971

int toStart = seq.getStart();

2972

2973

2974

* traverse [start, end, start, end...] ranges in fromSeq

2975

2976

for (int[] fromRange : seqMap.getMap().getFromRanges())

2977

{

2978

for (int i = 0; i < fromRange.length - 1; i += 2)

2979

{

2980

boolean forward = fromRange[i + 1] >= fromRange[i];

2981

2982

2983

* find the range mapped to (sequence positions base 1)

2984

2985

int[] range = seqMap.locateMappedRange(fromRange[i],

fromRange[i + 1]);

if (range == null)

{

jalview.bin.Console.errPrintln("Error in mapping " + seqMap

2990

+ " from " + fromSeq.getName());

2991

return false;

2992

}

2993

int fromCol = fromSeq.findIndex(fromRange[i]);

2994

int mappedCharPos = range[0];

2995

2996

2997

* walk over the 'from' aligned sequence in forward or reverse

2998

* direction; when a non-gap is found, record the column position

2999

* of the next character of the mapped-to sequence; stop when all

3000

* the characters of the range have been counted

3001

3002

2794300

while (mappedCharPos <= range[1] && fromCol <= fromSeq.getLength()

3003

&& fromCol >= 0)

3004

{

3005

2794265

if (!Comparison.isGap(fromSeq.getCharAt(fromCol - 1)))

3006

{

3007

3008

* mapped from sequence has a character in this column

3009

* record the column position for the mapped to character

3010

3011

32014

Map<SequenceI, Character> seqsMap = map.get(fromCol);

3012

32014

if (seqsMap == null)

3013

{

3014

5410

seqsMap = new HashMap<>();

3015

5410

map.put(fromCol, seqsMap);

3016

}

3017

32014

seqsMap.put(seq, seq.getCharAt(mappedCharPos - toStart));

3018

32014

mappedCharPos++;

3019

}

3020

2794265

fromCol += (forward ? 1 : -1);

}

}

}

return true;

}

// strictly temporary hack until proper criteria for aligning protein to cds

3028

// are in place; this is so Ensembl -> fetch xrefs Uniprot aligns the Uniprot

3029

public static boolean looksLikeEnsembl(AlignmentI alignment)

3030

{

3031

for (SequenceI seq : alignment.getSequences())

3032

{

3033

String name = seq.getName();

3034

if (!name.startsWith("ENSG") && !name.startsWith("ENST"))

{

return false;

}

}

return true;

}

/**

* Creates a deep copy of an alignment along with a dataset alignment,

3044

* alignment annotations, representative sequence and hidden columns.

3045

3046

public static AlignmentI deepCopyAlignment(AlignmentI alignment)

3047

{

3048

var alnCpy = new Alignment(alignment);

3049

alnCpy.setGapCharacter(alignment.getGapCharacter());

3050

alnCpy.setDataset(alignment.getDataset());

3051

for (AlignmentAnnotation annotation : alignment.getAlignmentAnnotation())

3052

alnCpy.addAnnotation(new AlignmentAnnotation(annotation));

3053

if (alignment.hasSeqrep())

3054

{

3055

int idx = alignment.findIndex(alignment.getSeqrep());

3056

if (idx >= 0)

3057

alnCpy.setSeqrep(alnCpy.getSequenceAt(idx));

3058

}

3059

if (alignment.getHiddenColumns() != null)

3060

alnCpy.setHiddenColumns(new HiddenColumns(alignment.getHiddenColumns()));

return alnCpy;

}

/**

* This method filters and returns the secondary structure annotations

3066

* in an array of annotations

3067

3068

* @param annotations

3069

* @return array of secondary structure annotations

3070

3071

public static List<AlignmentAnnotation> getSecondaryStructureAnnots(

3072

AlignmentAnnotation[] annotations)

3073

{

3074

List<AlignmentAnnotation> ssAnnotations = new ArrayList<>();

3075

if (annotations == null || annotations.length == 0)

{

return null;

}

synchronized (annotations)

3081

{

3082

for (AlignmentAnnotation aa : annotations)

{

if (aa == null)

{

continue;

}

if (aa.label != null && Constants.SECONDARY_STRUCTURE_LABELS

3090

.containsKey(aa.label))

3091

{

3092

ssAnnotations.add(aa);

}

}

}

return ssAnnotations;

}

public static boolean isSecondaryStructurePresent(

3101

AlignmentAnnotation[] annotations)

3102

{

3103

boolean ssPresent = false;

3104

if (annotations == null || annotations.length == 0)

{

return false;

}

synchronized (annotations)

3110

{

3111

for (AlignmentAnnotation aa : annotations)

{

if (aa == null)

{

continue;

}

// TODO: @RENIA decide what exactly we should be testing for - not

3118

// strings/labels

3119

if (// aa.isValidStruc() || aa.hasIcons ||

3120

(aa.label != null && Constants.SECONDARY_STRUCTURE_LABELS

3121

.containsKey(aa.label)))

{

ssPresent = true;

break;

}

}

}

return ssPresent;

}

public static Color getSecondaryStructureAnnotationColour(char symbol)

3133

{

3134

3135

if (symbol == Constants.COIL)

{

return Color.gray;

}

if (symbol == Constants.SHEET)

{

return Color.green;

}

if (symbol == Constants.HELIX)

{

return Color.red;

}

return Color.white;

}

111449

public static char findSSAnnotationForGivenSeqposition(

3152

AlignmentAnnotation aa, int seqPosition)

3153

{

3154

111446

char ss = '*';

3155

3156

111434

if (aa != null)

3157

{

3158

111455

if (aa.getAnnotationForPosition(seqPosition) != null)

3159

{

3160

57623

Annotation a = aa.getAnnotationForPosition(seqPosition);

3161

57619

ss = a.secondaryStructure;

3162

3163

// There is no representation for coil and it can be either ' ' or null.

3164

57638

if (ss == ' ' || ss == '-')

3165

{

3166

14767

ss = Constants.COIL;

}

}

else

{

53832

ss = Constants.COIL;

}

}

111420

return ss;

3176

}

3177

3178

3872

public static List<String> extractSSSourceInAlignmentAnnotation(

3179

AlignmentAnnotation[] annotations)

3180

{

3181

3182

3872

List<String> ssSources = new ArrayList<>();

3183

3872

Set<String> addedSources = new HashSet<>(); // to keep track of added

3184

// sources

3185

3186

3872

if (annotations == null)

{

return ssSources;

}

3860

for (AlignmentAnnotation aa : annotations)

3192

{

3193

3194

20440

String ssSource = AlignmentAnnotationUtils.extractSSSourceFromAnnotationDescription(aa);

3195

3196

20440

if (ssSource != null && !addedSources.contains(ssSource))

3197

{

3198

298

ssSources.add(ssSource);

3199

298

addedSources.add(ssSource);

}

}

3860

Collections.sort(ssSources);

3204

3205

3860

return ssSources;

}

/**

* Returns secondary structure annotations from the given sequence for a specified source.

3212

* @param seq the sequence

3213

* @param ssSource the source label ("PDB", "JPred")

3214

* @return list of matching annotations

3215

3216

6317931

public static List<AlignmentAnnotation> getAlignmentAnnotationForSource(

3217

SequenceI seq, String ssSource)

3218

{

3219

3220

6317993

List<AlignmentAnnotation> ssAnnots = new ArrayList<AlignmentAnnotation>();

3221

3222

// Iterate through all known secondary structure labels

3223

6318066

for (String ssLabel : Constants.SECONDARY_STRUCTURE_LABELS.keySet())

3224

{

3225

3226

12633741

AlignmentAnnotation[] aa = seq.getAnnotation(ssLabel);

3227

12634062

if (aa != null)

3228

{

3229

// If source is "ALL", include all annotations for this label

3230

189210

if (Constants.SS_ALL_PROVIDERS.equals(ssSource))

3231

{

3232

72020

ssAnnots.addAll(Arrays.asList(aa));

3233

72020

continue;

3234

}

3235

3236

117190

for (AlignmentAnnotation annot : aa)

3237

{

3238

138419

String ssSourceForAnnot = AlignmentAnnotationUtils.extractSSSourceFromAnnotationDescription(

3239

annot);

3240

// Add annotations from the matching source

3241

138419

if (ssSourceForAnnot != null && ssSource.equals(ssSourceForAnnot)

3242

&& annot.isForDisplay())

3243

{

3244

47893

ssAnnots.add(annot);

}

}

}

}

6319126

if (ssAnnots.size() > 0)

3250

{

3251

102148

return ssAnnots;

3252

}

3253

3254

6217122

return null;

}

public static Map<SequenceI, ArrayList<AlignmentAnnotation>> getSequenceAssociatedAlignmentAnnotations(

3259

AlignmentAnnotation[] alignAnnotList, String selectedSSSource)

3260

{

3261

3262

Map<SequenceI, ArrayList<AlignmentAnnotation>> ssAlignmentAnnotationForSequences = new HashMap<SequenceI, ArrayList<AlignmentAnnotation>>();

3263

if (alignAnnotList == null || alignAnnotList.length == 0)

3264

{

3265

return ssAlignmentAnnotationForSequences;

3266

}

3267

3268

for (AlignmentAnnotation aa : alignAnnotList)

3269

{

3270

251

if (aa.sequenceRef == null)

{

continue;

}

219

if (isSecondaryStructureFrom(selectedSSSource, aa))

3276

{

3277

ssAlignmentAnnotationForSequences

3278

.computeIfAbsent(aa.sequenceRef.getDatasetSequence(),

3279

k -> new ArrayList<>())

.add(aa);

}

}

return ssAlignmentAnnotationForSequences;

}

/**

* param alignAnnotation

3290

* @param selectedSSSource

3291

* @return any alignment annotation that matches the given source

3292

3293

public static List<AlignmentAnnotation> getSecondaryStructureAnnotionFor(List<AlignmentAnnotation> alignAnnotation, String selectedSSSource)

3294

{

3295

ArrayList<AlignmentAnnotation> annForSource = new ArrayList();

3296

for (AlignmentAnnotation alan:alignAnnotation)

3297

{

3298

if (isSecondaryStructureFrom(selectedSSSource, alan)) {

3299

annForSource.add(alan);

}

}

return annForSource;

}

/**

* @param selectedSSSource

3308

* @param aa

3309

* @return true if aa is from a provider or all providers as specified by

3310

* selectedSSSource

3311

3312

219

public static boolean isSecondaryStructureFrom(String selectedSSSource,

3313

AlignmentAnnotation aa)

3314

{

3315

3316

219

for (String label : Constants.SECONDARY_STRUCTURE_LABELS.keySet())

3317

{

3318

3319

376

if (label.equals(aa.label))

3320

{

3321

3322

170

if (selectedSSSource.equals(Constants.SS_ALL_PROVIDERS))

{

return true;

}

132

String ssSource = AlignmentAnnotationUtils

3327

.extractSSSourceFromAnnotationDescription(aa);

3328

132

if (ssSource != null && ssSource.equals(selectedSSSource))

{

return true;

}

}

}

141

return false;

3335

}

3336

3337

// Method to get the key for a given provider value

3338

public static String getSecondaryStructureProviderKey(

3339

String providerValue)

3340

{

3341

for (Map.Entry<String, String> entry : Constants.STRUCTURE_PROVIDERS

3342

.entrySet())

3343

{

3344

if (entry.getValue().equals(providerValue))

3345

{

3346

return entry.getKey(); // Return the key (abbreviation) for the matching

// provider value

}

}

return null; // Return null if no match is found

3351

}

3352

3353

public static String reduceLabelLength(String label)

3354

{

3355

// Split the input by " | "

3356

StringBuilder reducedLabel = new StringBuilder();

3357

for (String part:label.split(" \\| ")) {

3358

String nextLabel=part;

3359

for (Entry<String,String> provider:Constants.STRUCTURE_PROVIDERS.entrySet()) {

3360

if (part.equals(provider.getValue())) {

3361

nextLabel = provider.getKey();

3362

}

3363

}

3364

if (reducedLabel.length()>0)

3365

{

3366

reducedLabel.append(" | ");

3367

}

3368

reducedLabel.append(nextLabel);

3369

}

3370

return reducedLabel.toString();

3371

}

3372

3373

596

public static HashMap<String, Color> assignColorsForSecondaryStructureProviders(

3374

List<String> labels)

3375

{

3376

// Loop through each unique label and add it to the map with a colour.

3377

// for (String label : uniqueLabels)

3378

3379

596

HashMap<String, Color> secondaryStructureProviderColorMap = new HashMap<String, Color>();

3380

596

for (String label : labels)

3381

{

3382

// Generate or retrieve a colour for the label.

3383

544

String name = label.toUpperCase(Locale.ROOT).trim();

3384

544

secondaryStructureProviderColorMap.put(name,

3385

ColorUtils.getColourFromNameAndScheme(name, "NONE"));

3386

}

3387

3388

596

return secondaryStructureProviderColorMap;

3389

}

3390

3391

public static int computeMaxShifts(SequenceI[] seqs, ShiftList inserts)

{

int oldwidth = 0;

int p = 0, lastP = 0, lastIns = 0;

3396

for (SequenceI seq : seqs)

3397

{

3398

140

char[] sqs = seq.getSequence();

3399

// System.out.println(seq.getSequenceAsString());

3400

140

if (oldwidth < sqs.length)

3401

{

3402

oldwidth = sqs.length;

3403

}

3404

140

p = 0;

3405

140

lastP = 0;

3406

140

lastIns = 0;

3407

140

int modelOffset = 0; // shift between index and insertions encountered

3408

140

3409

{

3410

53877

if (sqs[p] >= 'a' && sqs[p] <= 'z')

3411

{

3412

2015

if (lastIns == 0)

3413

{

3414

589

lastP = (modelOffset + p) * 2;

3415

}

3416

2015

lastIns++;

}

else

{

51862

if (lastIns > 0)

3421

{

3422

586

inserts.extendShift(lastP, lastIns);

3423

586

modelOffset -= lastIns;

3424

}

3425

51862

lastIns = 0;

3426

}

3427

53877

} while (++p < sqs.length);

3428

140

if (lastIns > 0)

3429

{

3430

inserts.extendShift(lastP, lastIns);

}

}

return oldwidth;

}

/**

* quick and dirty lowercase - to - insert expansion

3438

3439

* @param seqs

3440

* - these will be direcly modified

3441

* @return message indicating how many gaps were inserted.

3442

3443

public static String a3mToMSA(SequenceI[] seqs)

3444

{

3445

String response = "";

3446

ShiftList inserts = new ShiftList();

3447

int oldwidth = computeMaxShifts(seqs, inserts);

3448

3449

int newwidth = insertShifts(seqs,inserts);

3450

if (oldwidth != newwidth)

3451

{

3452

response = "Added " + (newwidth - oldwidth) + " inserts.";

}

return response;

}

public static int insertShifts(SequenceI[] seqs, ShiftList inserts)

3458

{

3459

int newwidth=0;

3460

for (SequenceI seq : seqs)

3461

{

3462

boolean changed=false;

3463

int posShift = 0, totalShift = 0;

3464

for (int[] shift : inserts.getShifts())

3465

{

3466

// locate this shift in the totalShift'ed sequence

3467

5912

posShift = (shift[0] / 2);

3468

5912

int len = shift[1];

3469

3470

// account for any insertions in this sequence

3471

5912

int p = posShift + totalShift;

3472

7021

while (len > 0 && p < seq.getLength()

3473

&& (seq.getCharAt(p) >= 'a' && seq.getCharAt(p) <= 'z'))

3474

{

3475

1109

p++;

3476

1109

len--;

3477

}

3478

// and mark any remaining after the insert

3479

5912

if (len > 0)

3480

{

3481

5670

changed=true;

3482

5670

seq.doInsert(p, len, '-');

3483

}

3484

5912

totalShift += shift[1]; // update shifted positions in this sequence

}

if (changed)

{

seq.sequenceChanged();

3489

}

3490

newwidth = (seq.getLength() > newwidth) ? seq.getLength() : newwidth;

}

return newwidth;

}

}

Coverage Report

File AlignmentUtils.java

Coverage histogram

Code metrics

Classes

Class AlignmentUtils

Class AlignmentUtils.DnaVariant

Contributing tests

Contributing tests

Source view