File Dna.java

Branches:

150

Statements:

371

Methods:

Classes:

LOC:

1,003

NCLOC:

672

Total complexity:

138

Complexity density:

0.37

Statements/Method:

23.19

Methods/Class:

Average method complexity:

8.62

Classes

Class	Line #	Total Statements	Complexity	TOTAL Coverage
Dna	50	371	138	0.6499069 (65%)

Class Dna

Class Dna	Line # 50	Total Statements 371	Complexity 138	TOTAL Coverage 0.6499069 (65%)
Method	Line #	Statements	Complexity	Coverage
Dna(AlignViewportI,Iterator<int[]>)	99	8	1	1.0 (100%)
initContigs() : void	114	18	3	1.0 (100%)
compareCodonPos(AlignedCodon,AlignedCodon) : int	166	1	1	1.0 (100%)
jalview_2_8_2compare(AlignedCodon,AlignedCodon) : int	180	5	7	0.0 (0%)
translateCdna(GeneticCodeI) : AlignmentI	201	21	5	0.9655172 (96.6%)
canTranslate(SequenceI[],int[]) : boolean	250	19	12	0.0 (0%)
translateAlignedAnnotations(AlignmentI,AlignedCodonFrame) : void	302	27	15	0.12765957 (12.8%)
getCodonAnnotation(AlignedCodon,Annotation[]) : Annotation	375	22	10	0.0 (0%)
translateCodingRegion(SequenceI,String,AlignedCodonFrame,List<SequenceI>,GeneticCodeI) : SequenceI	437	125	38	0.7326203 (73.3%)
insertAAGap(int,List<SequenceI>) : void	751	8	2	0.9 (90%)
checkCodonFrameWidth() : void	777	4	2	0.33333334 (33.3%)
transferCodedFeatures(SequenceI,SequenceI,MapList) : void	798	2	2	0.25 (25%)
reverseCdna(boolean) : AlignmentI	834	10	3	0.9285714 (92.9%)
reverseSequence(String,String,boolean) : SequenceI	865	12	5	1.0 (100%)
reverseComplement(String) : String	894	4	2	1.0 (100%)
getComplement(char) : char	912	85	30	0.9764706 (97.6%)

Contributing tests

This file is covered by 16 tests.

Contributing tests

Test contribution	Test	Result
0.40037245	jalview.analysis.DnaTest.testTranslateCdna_withUntranslatableCodons	1 PASS
0.33705774	jalview.analysis.DnaTest.testTranslateCdna_withUntranslatableCodonsAndHiddenColumns	1 PASS
0.2700186	jalview.renderer.seqfeatures.FeatureRendererTest.testFindComplementFeaturesAtResidue	1 PASS
0.26815644	jalview.analysis.DnaTest.testTranslateCdna_sequenceOrderIndependent	1 PASS
0.26443204	jalview.analysis.DnaTest.testTranslateCdna_hiddenColumns	1 PASS
0.26070765	jalview.analysis.DnaTest.testTranslateCdna_simple	1 PASS
0.15270019	jalview.analysis.DnaTest.testGetComplement	1 PASS
0.12290503	jalview.analysis.DnaTest.testReverseSequence	1 PASS
0.11731844	jalview.analysis.DnaTest.testReverseCdna	1 PASS
0.05027933	jalview.ext.ensembl.EnsemblSeqProxyTest.testReverseComplementAlleles	1 PASS
0.044692736	jalview.ext.ensembl.EnsemblSeqProxyTest.testReverseComplementAllele	1 PASS
0.04283054	jalview.io.vcf.VCFLoaderTest.testDoLoad_reverseStrand	1 PASS
0.04283054	jalview.io.vcf.VCFLoaderTest.testDoLoad	1 PASS
0.0037243948	jalview.analysis.DnaTest.testCompareCodonPos	1 PASS
0.0037243948	jalview.analysis.DnaTest.testCompareCodonPos_oneOnly	1 PASS
0.0037243948	jalview.analysis.DnaTest.testCompareCodonPos_isSymmetric	1 PASS

Source view

/*
 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
 * Copyright (C) $$Year-Rel$$ The Jalview Authors
 * 
 * This file is part of Jalview.
 * 
 * Jalview is free software: you can redistribute it and/or
 * modify it under the terms of the GNU General Public License 
 * as published by the Free Software Foundation, either version 3
 * of the License, or (at your option) any later version.
 *  
 * Jalview is distributed in the hope that it will be useful, but 
 * WITHOUT ANY WARRANTY; without even the implied warranty 
 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR 
 * PURPOSE.  See the GNU General Public License for more details.
 * 
 * You should have received a copy of the GNU General Public License
 * along with Jalview.  If not, see <http://www.gnu.org/licenses/>.
 * The Jalview Authors are detailed in the 'AUTHORS' file.
 */

package jalview.analysis;

import jalview.api.AlignViewportI;

import jalview.datamodel.AlignedCodon;

import jalview.datamodel.AlignedCodonFrame;

import jalview.datamodel.Alignment;

import jalview.datamodel.AlignmentAnnotation;

import jalview.datamodel.AlignmentI;

import jalview.datamodel.Annotation;

import jalview.datamodel.DBRefEntry;

import jalview.datamodel.DBRefSource;

import jalview.datamodel.FeatureProperties;

import jalview.datamodel.GraphLine;

import jalview.datamodel.Mapping;

import jalview.datamodel.Sequence;

import jalview.datamodel.SequenceFeature;

import jalview.datamodel.SequenceI;

import jalview.schemes.ResidueProperties;

import jalview.util.Comparison;

import jalview.util.DBRefUtils;

import jalview.util.MapList;

import jalview.util.ShiftList;

import java.util.ArrayList;

import java.util.Arrays;

import java.util.Comparator;

import java.util.Iterator;

import java.util.List;

public class Dna

{

private static final String STOP_ASTERIX = "*";

private static final Comparator<AlignedCodon> comparator = new CodonComparator();

/*
 * 'final' variables describe the inputs to the translation, which should not
 * be modified.
 */

private final List<SequenceI> selection;

private final String[] seqstring;

private final Iterator<int[]> contigs;

private final char gapChar;

private final AlignmentAnnotation[] annotations;

private final int dnaWidth;

private final AlignmentI dataset;

private ShiftList vismapping;

private int[] startcontigs;

/*
 * Working variables for the translation.
 * 
 * The width of the translation-in-progress protein alignment.
 */

private int aaWidth = 0;

/*
 * This array will be built up so that position i holds the codon positions
 * e.g. [7, 9, 10] that match column i (base 0) in the aligned translation.
 * Note this implies a contract that if two codons do not align exactly, their
 * translated products must occupy different column positions.
 */

private AlignedCodon[] alignedCodons;

/**

* Constructor given a viewport and the visible contigs.

* @param viewport

* @param visibleContigs

public Dna(AlignViewportI viewport, Iterator<int[]> visibleContigs)

100

{

101

this.selection = Arrays.asList(viewport.getSequenceSelection());

102

this.seqstring = viewport.getViewAsString(true);

103

this.contigs = visibleContigs;

104

this.gapChar = viewport.getGapCharacter();

105

this.annotations = viewport.getAlignment().getAlignmentAnnotation();

106

this.dnaWidth = viewport.getAlignment().getWidth();

107

this.dataset = viewport.getAlignment().getDataset();

initContigs();

}

/**

* Initialise contigs used as starting point for translateCodingRegion

113

114

private void initContigs()

115

{

116

vismapping = new ShiftList(); // map from viscontigs to seqstring

// intervals

int npos = 0;

int[] lastregion = null;

121

ArrayList<Integer> tempcontigs = new ArrayList<>();

122

while (contigs.hasNext())

123

{

124

int[] region = contigs.next();

125

if (lastregion == null)

126

{

127

vismapping.addShift(npos, region[0]);

}

else

{

// hidden region

vismapping.addShift(npos, region[0] - lastregion[1] + 1);

133

}

134

lastregion = region;

135

tempcontigs.add(region[0]);

136

tempcontigs.add(region[1]);

137

}

138

139

startcontigs = new int[tempcontigs.size()];

140

int i = 0;

141

for (Integer val : tempcontigs)

142

{

143

startcontigs[i] = val;

i++;

}

tempcontigs = null;

}

/**

* Test whether codon positions cdp1 should align before, with, or after cdp2.

151

* Returns zero if all positions match (or either argument is null). Returns

152

* -1 if any position in the first codon precedes the corresponding position

153

* in the second codon. Else returns +1 (some position in the second codon

154

* precedes the corresponding position in the first).

155

156

* Note this is not necessarily symmetric, for example:

157

* <ul>

158

* <li>compareCodonPos([2,5,6], [3,4,5]) returns -1</li>

159

* <li>compareCodonPos([3,4,5], [2,5,6]) also returns -1</li>

* </ul>

* @param ac1

* @param ac2

* @return

3347

public static final int compareCodonPos(AlignedCodon ac1, AlignedCodon ac2)

167

{

168

3347

return comparator.compare(ac1, ac2);

169

// return jalview_2_8_2compare(ac1, ac2);

}

/**

* Codon comparison up to Jalview 2.8.2. This rule is sequence order dependent

174

* - see http://issues.jalview.org/browse/JAL-1635

* @param ac1

* @param ac2

* @return

private static int jalview_2_8_2compare(AlignedCodon ac1,

181

AlignedCodon ac2)

182

{

183

if (ac1 == null || ac2 == null || (ac1.equals(ac2)))

{

return 0;

}

if (ac1.pos1 < ac2.pos1 || ac1.pos2 < ac2.pos2 || ac1.pos3 < ac2.pos3)

188

{

189

// one base in cdp1 precedes the corresponding base in the other codon

190

return -1;

191

}

192

// one base in cdp1 appears after the corresponding base in the other codon.

return 1;

}

/**

* Translates cDNA using the specified code table

* @return

public AlignmentI translateCdna(GeneticCodeI codeTable)

202

{

203

AlignedCodonFrame acf = new AlignedCodonFrame();

204

205

alignedCodons = new AlignedCodon[dnaWidth];

206

207

int s;

208

int sSize = selection.size();

209

List<SequenceI> pepseqs = new ArrayList<>();

210

240

for (s = 0; s < sSize; s++)

211

{

212

217

SequenceI newseq = translateCodingRegion(selection.get(s),

213

seqstring[s], acf, pepseqs, codeTable);

214

215

217

if (newseq != null)

216

{

217

pepseqs.add(newseq);

218

217

SequenceI ds = newseq;

219

217

if (dataset != null)

220

{

221

while (ds.getDatasetSequence() != null)

222

{

223

ds = ds.getDatasetSequence();

224

}

225

dataset.addSequence(ds);

}

}

}

SequenceI[] newseqs = pepseqs.toArray(new SequenceI[pepseqs.size()]);

231

AlignmentI al = new Alignment(newseqs);

232

// ensure we look aligned.

233

al.padGaps();

234

// link the protein translation to the DNA dataset

235

al.setDataset(dataset);

236

translateAlignedAnnotations(al, acf);

237

al.addCodonFrame(acf);

return al;

}

/**

* fake the collection of DbRefs with associated exon mappings to identify if

243

* a translation would generate distinct product in the currently selected

* region.

* @param selection

* @param viscontigs

* @return

public static boolean canTranslate(SequenceI[] selection,

251

int viscontigs[])

252

{

253

for (int gd = 0; gd < selection.length; gd++)

254

{

255

SequenceI dna = selection[gd];

256

List<DBRefEntry> dnarefs = DBRefUtils.selectRefs(dna.getDBRefs(),

257

jalview.datamodel.DBRefSource.DNACODINGDBS);

258

if (dnarefs != null)

259

{

260

// intersect with pep

261

List<DBRefEntry> mappedrefs = new ArrayList<>();

262

List<DBRefEntry> refs = dna.getDBRefs();

263

for (int d = 0, nd = refs.size(); d < nd; d++)

264

{

265

DBRefEntry ref = refs.get(d);

266

if (ref.getMap() != null && ref.getMap().getMap() != null

267

&& ref.getMap().getMap().getFromRatio() == 3

268

&& ref.getMap().getMap().getToRatio() == 1)

269

{

270

mappedrefs.add(ref); // add translated protein maps

271

}

272

}

273

dnarefs = mappedrefs;//.toArray(new DBRefEntry[mappedrefs.size()]);

274

for (int d = 0, nd = dnarefs.size(); d < nd; d++)

275

{

276

Mapping mp = dnarefs.get(d).getMap();

277

if (mp != null)

278

{

279

for (int vc = 0, nv = viscontigs.length; vc < nv; vc += 2)

280

{

281

int[] mpr = mp.locateMappedRange(viscontigs[vc],

viscontigs[vc + 1]);

if (mpr != null)

{

return true;

}

}

}

}

}

}

return false;

}

/**

* Translate nucleotide alignment annotations onto translated amino acid

297

* alignment using codon mapping codons

298

299

* @param al

300

* the translated protein alignment

301

302

protected void translateAlignedAnnotations(AlignmentI al,

303

AlignedCodonFrame acf)

304

{

305

// Can only do this for columns with consecutive codons, or where

306

// annotation is sequence associated.

307

308

if (annotations != null)

309

{

310

for (AlignmentAnnotation annotation : annotations)

311

{

312

313

* Skip hidden or autogenerated annotation. Also (for now), RNA

314

* secondary structure annotation. If we want to show this against

315

* protein we need a smarter way to 'translate' without generating

316

* invalid (unbalanced) structure annotation.

317

318

if (annotation.autoCalculated || !annotation.visible

319

|| annotation.isRNA())

320

{

321

318

continue;

}

int aSize = aaWidth;

Annotation[] anots = (annotation.annotations == null) ? null

326

: new Annotation[aSize];

327

if (anots != null)

328

{

329

for (int a = 0; a < aSize; a++)

330

{

331

// process through codon map.

332

if (a < alignedCodons.length && alignedCodons[a] != null

333

&& alignedCodons[a].pos1 == (alignedCodons[a].pos3 - 2))

334

{

335

anots[a] = getCodonAnnotation(alignedCodons[a],

336

annotation.annotations);

}

}

}

AlignmentAnnotation aa = new AlignmentAnnotation(annotation.label,

342

annotation.description, anots);

343

aa.graph = annotation.graph;

344

aa.graphGroup = annotation.graphGroup;

345

aa.graphHeight = annotation.graphHeight;

346

if (annotation.getThreshold() != null)

347

{

348

aa.setThreshold(new GraphLine(annotation.getThreshold()));

349

}

350

if (annotation.hasScore)

351

{

352

aa.setScore(annotation.getScore());

353

}

354

355

final SequenceI seqRef = annotation.sequenceRef;

356

if (seqRef != null)

357

{

358

SequenceI aaSeq = acf.getAaForDnaSeq(seqRef);

359

if (aaSeq != null)

360

{

361

// aa.compactAnnotationArray(); // throw away alignment annotation

362

// positioning

363

aa.setSequenceRef(aaSeq);

364

// rebuild mapping

365

aa.createSequenceMapping(aaSeq, aaSeq.getStart(), true);

366

aa.adjustForAlignment();

367

aaSeq.addAlignmentAnnotation(aa);

368

}

369

}

370

al.addAnnotation(aa);

}

}

}

private static Annotation getCodonAnnotation(AlignedCodon is,

376

Annotation[] annotations)

377

{

378

// Have a look at all the codon positions for annotation and put the first

379

// one found into the translated annotation pos.

380

int contrib = 0;

381

Annotation annot = null;

382

for (int p = 1; p <= 3; p++)

383

{

384

int dnaCol = is.getBaseColumn(p);

385

if (annotations[dnaCol] != null)

{

if (annot == null)

{

annot = new Annotation(annotations[dnaCol]);

contrib = 1;

}

else

{

// merge with last

Annotation cpy = new Annotation(annotations[dnaCol]);

396

if (annot.colour == null)

397

{

398

annot.colour = cpy.colour;

399

}

400

if (annot.description == null || annot.description.length() == 0)

401

{

402

annot.description = cpy.description;

403

}

404

if (annot.displayCharacter == null)

405

{

406

annot.displayCharacter = cpy.displayCharacter;

407

}

408

if (annot.secondaryStructure == 0)

409

{

410

annot.secondaryStructure = cpy.secondaryStructure;

411

}

412

annot.value += cpy.value;

contrib++;

}

}

}

if (contrib > 1)

{

annot.value /= contrib;

}

return annot;

}

/**

* Translate a na sequence

426

427

* @param selection

428

* sequence displayed under viscontigs visible columns

429

* @param seqstring

430

* ORF read in some global alignment reference frame

431

* @param acf

432

* Definition of global ORF alignment reference frame

433

* @param proteinSeqs

434

* @param codeTable

435

* @return sequence ready to be added to alignment.

436

437

217

protected SequenceI translateCodingRegion(SequenceI selection,

438

String seqstring, AlignedCodonFrame acf,

439

List<SequenceI> proteinSeqs, GeneticCodeI codeTable)

440

{

441

217

List<int[]> skip = new ArrayList<>();

442

217

int[] skipint = null;

443

444

217

int npos = 0;

445

217

int vc = 0;

446

447

217

int[] scontigs = new int[startcontigs.length];

448

217

System.arraycopy(startcontigs, 0, scontigs, 0, startcontigs.length);

449

450

// allocate a roughly sized buffer for the protein sequence

451

217

StringBuilder protein = new StringBuilder(seqstring.length() / 2);

452

217

String seq = seqstring.replace('U', 'T').replace('u', 'T');

453

217

char codon[] = new char[3];

454

217

int cdp[] = new int[3];

455

217

int rf = 0;

456

217

int lastnpos = 0;

457

217

int nend;

458

217

int aspos = 0;

459

217

int resSize = 0;

460

6275

for (npos = 0, nend = seq.length(); npos < nend; npos++)

461

{

462

6058

if (!Comparison.isGap(seq.charAt(npos)))

463

{

464

6028

cdp[rf] = npos; // store position

465

6028

codon[rf++] = seq.charAt(npos); // store base

466

}

467

6058

if (rf == 3)

468

{

469

470

* Filled up a reading frame...

471

472

1888

AlignedCodon alignedCodon = new AlignedCodon(cdp[0], cdp[1], cdp[2]);

473

1888

String aa = codeTable.translate(new String(codon));

474

1888

rf = 0;

475

1888

final String gapString = String.valueOf(gapChar);

476

1888

if (aa == null)

{

aa = gapString;

if (skipint == null)

{

skipint = new int[] { alignedCodon.pos1,

alignedCodon.pos3 /*

* cdp[0],

* cdp[2]

*/ };

}

skipint[1] = alignedCodon.pos3; // cdp[2];

}

else

{

1887

if (skipint != null)

492

{

493

// edit scontigs

494

skipint[0] = vismapping.shift(skipint[0]);

495

skipint[1] = vismapping.shift(skipint[1]);

496

for (vc = 0; vc < scontigs.length;)

497

{

498

if (scontigs[vc + 1] < skipint[0])

499

{

500

// before skipint starts

vc += 2;

continue;

}

if (scontigs[vc] > skipint[1])

505

{

506

// finished editing so

507

break;

508

}

509

// Edit the contig list to include the skipped region which did

510

// not translate

511

int[] t;

512

// from : s1 e1 s2 e2 s3 e3

513

// to s: s1 e1 s2 k0 k1 e2 s3 e3

514

// list increases by one unless one boundary (s2==k0 or e2==k1)

515

// matches, and decreases by one if skipint intersects whole

516

// visible contig

517

if (scontigs[vc] <= skipint[0])

518

{

519

if (skipint[0] == scontigs[vc])

520

{

521

// skipint at start of contig

522

// shift the start of this contig

523

if (scontigs[vc + 1] > skipint[1])

524

{

525

scontigs[vc] = skipint[1];

vc += 2;

}

else

{

if (scontigs[vc + 1] == skipint[1])

531

{

532

// remove the contig

533

t = new int[scontigs.length - 2];

534

if (vc > 0)

535

{

536

System.arraycopy(scontigs, 0, t, 0, vc - 1);

537

}

538

if (vc + 2 < t.length)

539

{

540

System.arraycopy(scontigs, vc + 2, t, vc,

t.length - vc + 2);

}

scontigs = t;

}

else

{

// truncate contig to before the skipint region

548

scontigs[vc + 1] = skipint[0] - 1;

vc += 2;

}

}

}

else

{

// scontig starts before start of skipint

556

if (scontigs[vc + 1] < skipint[1])

557

{

558

// skipint truncates end of scontig

559

scontigs[vc + 1] = skipint[0] - 1;

vc += 2;

}

else

{

// divide region to new contigs

565

t = new int[scontigs.length + 2];

566

System.arraycopy(scontigs, 0, t, 0, vc + 1);

567

t[vc + 1] = skipint[0];

568

t[vc + 2] = skipint[1];

569

System.arraycopy(scontigs, vc + 1, t, vc + 3,

570

scontigs.length - (vc + 1));

scontigs = t;

vc += 4;

}

}

}

}

skip.add(skipint);

skipint = null;

}

1887

if (aa.equals(ResidueProperties.STOP))

{

aa = STOP_ASTERIX;

}

1887

resSize++;

585

}

586

1888

boolean findpos = true;

587

5150

while (findpos)

588

{

589

590

* Compare this codon's base positions with those currently aligned to

591

* this column in the translation.

592

593

3262

final int compareCodonPos = compareCodonPos(alignedCodon,

594

alignedCodons[aspos]);

595

3262

switch (compareCodonPos)

596

{

597

178

case -1:

598

599

600

* This codon should precede the mapped positions - need to insert a

601

* gap in all prior sequences.

602

603

178

insertAAGap(aspos, proteinSeqs);

604

178

findpos = false;

605

178

break;

606

607

1374

case +1:

608

609

610

* This codon belongs after the aligned codons at aspos. Prefix it

611

* with a gap and try the next position.

612

613

1374

aa = gapString + aa;

614

1374

aspos++;

615

1374

break;

616

617

1710

case 0:

618

619

620

* Exact match - codon 'belongs' at this translated position.

621

622

1710

findpos = false;

623

}

624

}

625

1888

protein.append(aa);

626

1888

lastnpos = npos;

627

1888

if (alignedCodons[aspos] == null)

628

{

629

// mark this column as aligning to this aligned reading frame

630

466

alignedCodons[aspos] = alignedCodon;

631

}

632

1422

else if (!alignedCodons[aspos].equals(alignedCodon))

633

{

634

throw new IllegalStateException(

635

"Tried to coalign " + alignedCodons[aspos].toString()

636

+ " with " + alignedCodon.toString());

637

}

638

1888

if (aspos >= aaWidth)

639

{

640

// update maximum alignment width

641

449

aaWidth = aspos;

642

}

643

// ready for next translated reading frame alignment position (if any)

644

1888

aspos++;

645

}

646

}

647

217

if (resSize > 0)

648

{

649

217

SequenceI newseq = new Sequence(selection.getName(),

650

protein.toString());

651

217

if (rf != 0)

652

{

653

188

final String errMsg = "trimming contigs for incomplete terminal codon.";

654

188

System.err.println(errMsg);

655

// map and trim contigs to ORF region

656

188

vc = scontigs.length - 1;

657

188

lastnpos = vismapping.shift(lastnpos); // place npos in context of

658

// whole dna alignment (rather

659

// than visible contigs)

660

// incomplete ORF could be broken over one or two visible contig

661

// intervals.

662

376

while (vc >= 0 && scontigs[vc] > lastnpos)

663

{

664

188

if (vc > 0 && scontigs[vc - 1] > lastnpos)

{

vc -= 2;

}

else

{

// correct last interval in list.

671

188

scontigs[vc] = lastnpos;

}

}

188

if (vc > 0 && (vc + 1) < scontigs.length)

676

{

677

// truncate map list to just vc elements

678

int t[] = new int[vc + 1];

679

System.arraycopy(scontigs, 0, t, 0, vc + 1);

680

scontigs = t;

681

}

682

188

if (vc <= 0)

{

scontigs = null;

}

}

217

if (scontigs != null)

688

{

689

217

npos = 0;

690

// map scontigs to actual sequence positions on selection

691

412

for (vc = 0; vc < scontigs.length; vc += 2)

692

{

693

220

scontigs[vc] = selection.findPosition(scontigs[vc]); // not from 1!

694

220

scontigs[vc + 1] = selection.findPosition(scontigs[vc + 1]); // exclusive

695

220

if (scontigs[vc + 1] == selection.getEnd())

{

break;

}

}

// trim trailing empty intervals.

701

217

if ((vc + 2) < scontigs.length)

702

{

703

int t[] = new int[vc + 2];

704

System.arraycopy(scontigs, 0, t, 0, vc + 2);

scontigs = t;

}

* delete intervals in scontigs which are not translated. 1. map skip

709

* into sequence position intervals 2. truncate existing ranges and add

710

* new ranges to exclude untranslated regions. if (skip.size()>0) {

711

* Vector narange = new Vector(); for (vc=0; vc<scontigs.length; vc++) {

712

* narange.addElement(new int[] {scontigs[vc]}); } int sint=0,iv[]; vc =

713

* 0; while (sint<skip.size()) { skipint = (int[]) skip.elementAt(sint);

714

* do { iv = (int[]) narange.elementAt(vc); if (iv[0]>=skipint[0] &&

715

* iv[0]<=skipint[1]) { if (iv[0]==skipint[0]) { // delete beginning of

716

* range } else { // truncate range and create new one if necessary iv =

717

* (int[]) narange.elementAt(vc+1); if (iv[0]<=skipint[1]) { // truncate

718

* range iv[0] = skipint[1]; } else { } } } else if (iv[0]<skipint[0]) {

719

* iv = (int[]) narange.elementAt(vc+1); } } while (iv[0]) } }

720

721

217

MapList map = new MapList(scontigs, new int[] { 1, resSize }, 3, 1);

722

723

217

transferCodedFeatures(selection, newseq, map);

724

725

726

* Construct a dataset sequence for our new peptide.

727

728

217

SequenceI rseq = newseq.deriveSequence();

729

730

731

* Store a mapping (between the dataset sequences for the two

732

* sequences).

733

734

// SIDE-EFFECT: acf stores the aligned sequence reseq; to remove!

735

217

acf.addMap(selection, rseq, map);

736

217

return rseq;

737

}

738

}

739

// register the mapping somehow

return null;

}

/**

* Insert a gap into the aligned proteins and the codon mapping array.

* @param pos

* @param proteinSeqs

* @return

178

protected void insertAAGap(int pos, List<SequenceI> proteinSeqs)

752

{

753

178

aaWidth++;

754

178

for (SequenceI seq : proteinSeqs)

755

{

756

598

seq.insertCharAt(pos, gapChar);

757

}

758

759

178

checkCodonFrameWidth();

760

178

if (pos < aaWidth)

761

{

762

178

aaWidth++;

763

764

765

* Shift from [pos] to the end one to the right, and null out [pos]

766

767

178

System.arraycopy(alignedCodons, pos, alignedCodons, pos + 1,

768

alignedCodons.length - pos - 1);

769

178

alignedCodons[pos] = null;

}

}

/**

* Check the codons array can accommodate a single insertion, if not resize

775

* it.

776

777

178

protected void checkCodonFrameWidth()

778

{

779

178

if (alignedCodons[alignedCodons.length - 1] != null)

780

{

781

782

* arraycopy insertion would bump a filled slot off the end, so expand.

783

784

AlignedCodon[] c = new AlignedCodon[alignedCodons.length + 10];

785

System.arraycopy(alignedCodons, 0, c, 0, alignedCodons.length);

alignedCodons = c;

}

}

/**

* Given a peptide newly translated from a dna sequence, copy over and set any

792

* features on the peptide from the DNA.

* @param dna

* @param pep

* @param map

217

private static void transferCodedFeatures(SequenceI dna, SequenceI pep,

799

MapList map)

800

{

801

// BH 2019.01.25 nop?

802

// List<DBRefEntry> dnarefs = DBRefUtils.selectRefs(dna.getDBRefs(),

803

// DBRefSource.DNACODINGDBS);

804

// if (dnarefs != null)

805

// {

806

// // intersect with pep

807

// for (int d = 0, nd = dnarefs.size(); d < nd; d++)

808

// {

809

// Mapping mp = dnarefs.get(d).getMap();

// if (mp != null)

// {

// }

// }

// }

217

for (SequenceFeature sf : dna.getFeatures().getAllFeatures())

816

{

817

if (FeatureProperties.isCodingFeature(null, sf.getType()))

818

{

819

// if (map.intersectsFrom(sf[f].begin, sf[f].end))

{

}

}

}

}

/**

* Returns an alignment consisting of the reversed (and optionally

829

* complemented) sequences set in this object's constructor

* @param complement

* @return

public AlignmentI reverseCdna(boolean complement)

835

{

836

int sSize = selection.size();

837

List<SequenceI> reversed = new ArrayList<>();

838

for (int s = 0; s < sSize; s++)

839

{

840

SequenceI newseq = reverseSequence(selection.get(s).getName(),

841

seqstring[s], complement);

if (newseq != null)

{

reversed.add(newseq);

}

}

SequenceI[] newseqs = reversed.toArray(new SequenceI[reversed.size()]);

850

AlignmentI al = new Alignment(newseqs);

851

((Alignment) al).createDatasetAlignment();

return al;

}

/**

* Returns a reversed, and optionally complemented, sequence. The new

857

* sequence's name is the original name with "|rev" or "|revcomp" appended.

858

* aAcCgGtT and DNA ambiguity codes are complemented, any other characters are

* left unchanged.

* @param seq

* @param complement

* @return

public static SequenceI reverseSequence(String seqName, String sequence,

866

boolean complement)

867

{

868

String newName = seqName + "|rev" + (complement ? "comp" : "");

869

char[] originalSequence = sequence.toCharArray();

870

int length = originalSequence.length;

871

char[] reversedSequence = new char[length];

872

int bases = 0;

873

for (int i = 0; i < length; i++)

874

{

875

char c = complement ? getComplement(originalSequence[i])

876

: originalSequence[i];

877

reversedSequence[length - i - 1] = c;

878

if (!Comparison.isGap(c))

{

bases++;

}

}

SequenceI reversed = new Sequence(newName, reversedSequence, 1, bases);

return reversed;

}

/**

* Answers the reverse complement of the input string

889

890

* @see #getComplement(char)

* @param s

* @return

public static String reverseComplement(String s)

895

{

896

StringBuilder sb = new StringBuilder(s.length());

897

for (int i = s.length() - 1; i >= 0; i--)

898

{

899

sb.append(Dna.getComplement(s.charAt(i)));

900

}

901

return sb.toString();

}

/**

* Returns dna complement (preserving case) for aAcCgGtTuU. Ambiguity codes

906

* are treated as on http://reverse-complement.com/. Anything else is left

* unchanged.

* @param c

* @return

106

public static char getComplement(char c)

913

{

914

106

char result = c;

915

106

switch (c)

{

case '-':

case '.':

case ' ':

break;

case 'a':

result = 't';

break;

case 'A':

result = 'T';

break;

case 'c':

result = 'g';

break;

case 'C':

result = 'G';

break;

case 'g':

result = 'c';

break;

case 'G':

result = 'C';

break;

case 't':

result = 'a';

break;

case 'T':

result = 'A';

break;

case 'u':

result = 'a';

break;

case 'U':

result = 'A';

break;

case 'r':

result = 'y';

break;

case 'R':

result = 'Y';

break;

case 'y':

result = 'r';

break;

case 'Y':

result = 'R';

break;

case 'k':

result = 'm';

break;

case 'K':

result = 'M';

break;

case 'm':

result = 'k';

break;

case 'M':

result = 'K';

break;

case 'b':

result = 'v';

break;

case 'B':

result = 'V';

break;

case 'v':

result = 'b';

break;

case 'V':

result = 'B';

break;

case 'd':

result = 'h';

break;

case 'D':

result = 'H';

break;

case 'h':

result = 'd';

break;

case 'H':

result = 'D';

break;

}

106

return result;

1002

}

1003

}

Coverage Report

File Dna.java

Coverage histogram

Code metrics

Classes

Class Dna

Contributing tests

Contributing tests

Source view