File Dna.java

Branches:

150

Statements:

371

Methods:

16

Classes:

1

LOC:

1,005

NCLOC:

674

Total complexity:

138

Complexity density:

0.37

Statements/Method:

23.19

Methods/Class:

16

Average method complexity:

8.62

Classes

Class	Line #	Total Statements	Complexity	TOTAL Coverage	Actions
Dna	50	371	138	63.7% (0.6368715)

Class Dna

Class Dna	Line # 50	Total Statements 371	Complexity 138	TOTAL Coverage 63.7% (0.6368715)
Method	Line #	Statements	Complexity	Coverage
Dna(AlignViewportI,Iterator<int[]>)	99	8	1	100% (1.0)
initContigs() : void	114	18	3	100% (1.0)
compareCodonPos(AlignedCodon,AlignedCodon) : int	166	1	1	100% (1.0)
jalview_2_8_2compare(AlignedCodon,AlignedCodon) : int	181	5	7	0% (0.0)
translateCdna(GeneticCodeI) : AlignmentI	202	21	5	96.6% (0.9655172)
canTranslate(SequenceI[],int[]) : boolean	251	19	12	0% (0.0)
translateAlignedAnnotations(AlignmentI,AlignedCodonFrame) : void	303	27	15	12.8% (0.12765957)
getCodonAnnotation(AlignedCodon,Annotation[]) : Annotation	376	22	10	0% (0.0)
translateCodingRegion(SequenceI,String,AlignedCodonFrame,List<SequenceI>,GeneticCodeI) : SequenceI	438	125	38	73.3% (0.7326203)
insertAAGap(int,List<SequenceI>) : void	753	8	2	90% (0.9)
checkCodonFrameWidth() : void	779	4	2	33.3% (0.33333334)
transferCodedFeatures(SequenceI,SequenceI,MapList) : void	800	2	2	25% (0.25)
reverseCdna(boolean) : AlignmentI	836	10	3	92.9% (0.9285714)
reverseSequence(String,String,boolean) : SequenceI	867	12	5	100% (1.0)
reverseComplement(String) : String	896	4	2	0% (0.0)
getComplement(char) : char	914	85	30	97.6% (0.9764706)

Contributing tests

This file is covered by 14 tests.

Contributing tests

Test contribution	Test	Result
0.40037245	jalview.analysis.DnaTest.testTranslateCdna_withUntranslatableCodons	PASS
0.33705774	jalview.analysis.DnaTest.testTranslateCdna_withUntranslatableCodonsAndHiddenColumns	PASS
0.2700186	jalview.renderer.seqfeatures.FeatureRendererTest.testFindComplementFeaturesAtResidue	PASS
0.26815644	jalview.analysis.DnaTest.testTranslateCdna_sequenceOrderIndependent	PASS
0.26443204	jalview.analysis.DnaTest.testTranslateCdna_hiddenColumns	PASS
0.26070765	jalview.analysis.DnaTest.testTranslateCdna_simple	PASS
0.15270019	jalview.analysis.DnaTest.testGetComplement	PASS
0.12290503	jalview.analysis.DnaTest.testReverseSequence	PASS
0.11731844	jalview.analysis.DnaTest.testReverseCdna	PASS
0.05027933	jalview.ext.ensembl.EnsemblSeqProxyTest.testReverseComplementAlleles	PASS
0.044692736	jalview.ext.ensembl.EnsemblSeqProxyTest.testReverseComplementAllele	PASS
0.0037243948	jalview.analysis.DnaTest.testCompareCodonPos	PASS
0.0037243948	jalview.analysis.DnaTest.testCompareCodonPos_oneOnly	PASS
0.0037243948	jalview.analysis.DnaTest.testCompareCodonPos_isSymmetric	PASS

Source view

/*
 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
 * Copyright (C) $$Year-Rel$$ The Jalview Authors
 *
 * This file is part of Jalview.
 *
 * Jalview is free software: you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation, either version 3
 * of the License, or (at your option) any later version.
 *
 * Jalview is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty
 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
 * PURPOSE. See the GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
 * The Jalview Authors are detailed in the 'AUTHORS' file.
 */

package jalview.analysis;

import jalview.api.AlignViewportI;

import jalview.datamodel.AlignedCodon;

import jalview.datamodel.AlignedCodonFrame;

import jalview.datamodel.Alignment;

import jalview.datamodel.AlignmentAnnotation;

import jalview.datamodel.AlignmentI;

import jalview.datamodel.Annotation;

import jalview.datamodel.DBRefEntry;

import jalview.datamodel.DBRefSource;

import jalview.datamodel.FeatureProperties;

import jalview.datamodel.GraphLine;

import jalview.datamodel.Mapping;

import jalview.datamodel.Sequence;

import jalview.datamodel.SequenceFeature;

import jalview.datamodel.SequenceI;

import jalview.schemes.ResidueProperties;

import jalview.util.Comparison;

import jalview.util.DBRefUtils;

import jalview.util.MapList;

import jalview.util.ShiftList;

import java.util.ArrayList;

import java.util.Arrays;

import java.util.Comparator;

import java.util.Iterator;

import java.util.List;

public class Dna

{

private static final String STOP_ASTERIX = "*";

private static final Comparator<AlignedCodon> comparator = new CodonComparator();

/*
 * 'final' variables describe the inputs to the translation, which should not
 * be modified.
 */

private final List<SequenceI> selection;

private final String[] seqstring;

private final Iterator<int[]> contigs;

private final char gapChar;

private final AlignmentAnnotation[] annotations;

private final int dnaWidth;

private final AlignmentI dataset;

private ShiftList vismapping;

private int[] startcontigs;

/*
 * Working variables for the translation.
 *
 * The width of the translation-in-progress protein alignment.
 */

private int aaWidth = 0;

/*
 * This array will be built up so that position i holds the codon positions
 * e.g. [7, 9, 10] that match column i (base 0) in the aligned translation.
 * Note this implies a contract that if two codons do not align exactly, their
 * translated products must occupy different column positions.
 */

private AlignedCodon[] alignedCodons;

/**

* Constructor given a viewport and the visible contigs.

* @param viewport

* @param visibleContigs

public Dna(AlignViewportI viewport, Iterator<int[]> visibleContigs)

100

{

101

this.selection = Arrays.asList(viewport.getSequenceSelection());

102

this.seqstring = viewport.getViewAsString(true);

103

this.contigs = visibleContigs;

104

this.gapChar = viewport.getGapCharacter();

105

this.annotations = viewport.getAlignment().getAlignmentAnnotation();

106

this.dnaWidth = viewport.getAlignment().getWidth();

107

this.dataset = viewport.getAlignment().getDataset();

initContigs();

}

/**

* Initialise contigs used as starting point for translateCodingRegion

113

114

private void initContigs()

115

{

116

vismapping = new ShiftList(); // map from viscontigs to seqstring

// intervals

int npos = 0;

int[] lastregion = null;

121

ArrayList<Integer> tempcontigs = new ArrayList<>();

122

while (contigs.hasNext())

123

{

124

int[] region = contigs.next();

125

if (lastregion == null)

126

{

127

vismapping.addShift(npos, region[0]);

}

else

{

// hidden region

vismapping.addShift(npos, region[0] - lastregion[1] + 1);

133

}

134

lastregion = region;

135

tempcontigs.add(region[0]);

136

tempcontigs.add(region[1]);

137

}

138

139

startcontigs = new int[tempcontigs.size()];

140

int i = 0;

141

for (Integer val : tempcontigs)

142

{

143

startcontigs[i] = val;

i++;

}

tempcontigs = null;

}

/**

* Test whether codon positions cdp1 should align before, with, or after cdp2.

151

* Returns zero if all positions match (or either argument is null). Returns

152

* -1 if any position in the first codon precedes the corresponding position

153

* in the second codon. Else returns +1 (some position in the second codon

154

* precedes the corresponding position in the first).

155

156

* Note this is not necessarily symmetric, for example:

157

* <ul>

158

* <li>compareCodonPos([2,5,6], [3,4,5]) returns -1</li>

159

* <li>compareCodonPos([3,4,5], [2,5,6]) also returns -1</li>

* </ul>

* @param ac1

* @param ac2

* @return

3347

public static final int compareCodonPos(AlignedCodon ac1,

167

AlignedCodon ac2)

168

{

169

3347

return comparator.compare(ac1, ac2);

170

// return jalview_2_8_2compare(ac1, ac2);

}

/**

* Codon comparison up to Jalview 2.8.2. This rule is sequence order dependent

175

* - see http://issues.jalview.org/browse/JAL-1635

* @param ac1

* @param ac2

* @return

private static int jalview_2_8_2compare(AlignedCodon ac1,

182

AlignedCodon ac2)

183

{

184

if (ac1 == null || ac2 == null || (ac1.equals(ac2)))

{

return 0;

}

if (ac1.pos1 < ac2.pos1 || ac1.pos2 < ac2.pos2 || ac1.pos3 < ac2.pos3)

189

{

190

// one base in cdp1 precedes the corresponding base in the other codon

191

return -1;

192

}

193

// one base in cdp1 appears after the corresponding base in the other codon.

return 1;

}

/**

* Translates cDNA using the specified code table

* @return

public AlignmentI translateCdna(GeneticCodeI codeTable)

203

{

204

AlignedCodonFrame acf = new AlignedCodonFrame();

205

206

alignedCodons = new AlignedCodon[dnaWidth];

207

208

int s;

209

int sSize = selection.size();

210

List<SequenceI> pepseqs = new ArrayList<>();

211

240

for (s = 0; s < sSize; s++)

212

{

213

217

SequenceI newseq = translateCodingRegion(selection.get(s),

214

seqstring[s], acf, pepseqs, codeTable);

215

216

217

if (newseq != null)

217

{

218

217

pepseqs.add(newseq);

219

217

SequenceI ds = newseq;

220

217

if (dataset != null)

221

{

222

while (ds.getDatasetSequence() != null)

223

{

224

ds = ds.getDatasetSequence();

225

}

226

dataset.addSequence(ds);

}

}

}

SequenceI[] newseqs = pepseqs.toArray(new SequenceI[pepseqs.size()]);

232

AlignmentI al = new Alignment(newseqs);

233

// ensure we look aligned.

234

al.padGaps();

235

// link the protein translation to the DNA dataset

236

al.setDataset(dataset);

237

translateAlignedAnnotations(al, acf);

238

al.addCodonFrame(acf);

return al;

}

/**

* fake the collection of DbRefs with associated exon mappings to identify if

244

* a translation would generate distinct product in the currently selected

* region.

* @param selection

* @param viscontigs

* @return

public static boolean canTranslate(SequenceI[] selection,

252

int viscontigs[])

253

{

254

for (int gd = 0; gd < selection.length; gd++)

255

{

256

SequenceI dna = selection[gd];

257

List<DBRefEntry> dnarefs = DBRefUtils.selectRefs(dna.getDBRefs(),

258

jalview.datamodel.DBRefSource.DNACODINGDBS);

259

if (dnarefs != null)

260

{

261

// intersect with pep

262

List<DBRefEntry> mappedrefs = new ArrayList<>();

263

List<DBRefEntry> refs = dna.getDBRefs();

264

for (int d = 0, nd = refs.size(); d < nd; d++)

265

{

266

DBRefEntry ref = refs.get(d);

267

if (ref.getMap() != null && ref.getMap().getMap() != null

268

&& ref.getMap().getMap().getFromRatio() == 3

269

&& ref.getMap().getMap().getToRatio() == 1)

270

{

271

mappedrefs.add(ref); // add translated protein maps

272

}

273

}

274

dnarefs = mappedrefs;// .toArray(new DBRefEntry[mappedrefs.size()]);

275

for (int d = 0, nd = dnarefs.size(); d < nd; d++)

276

{

277

Mapping mp = dnarefs.get(d).getMap();

278

if (mp != null)

279

{

280

for (int vc = 0, nv = viscontigs.length; vc < nv; vc += 2)

281

{

282

int[] mpr = mp.locateMappedRange(viscontigs[vc],

viscontigs[vc + 1]);

if (mpr != null)

{

return true;

}

}

}

}

}

}

return false;

}

/**

* Translate nucleotide alignment annotations onto translated amino acid

298

* alignment using codon mapping codons

299

300

* @param al

301

* the translated protein alignment

302

303

protected void translateAlignedAnnotations(AlignmentI al,

304

AlignedCodonFrame acf)

305

{

306

// Can only do this for columns with consecutive codons, or where

307

// annotation is sequence associated.

308

309

if (annotations != null)

310

{

311

for (AlignmentAnnotation annotation : annotations)

312

{

313

314

* Skip hidden or autogenerated annotation. Also (for now), RNA

315

* secondary structure annotation. If we want to show this against

316

* protein we need a smarter way to 'translate' without generating

317

* invalid (unbalanced) structure annotation.

318

319

318

if (annotation.autoCalculated || !annotation.isForDisplay()

320

|| annotation.isRNA())

321

{

322

318

continue;

}

int aSize = aaWidth;

Annotation[] anots = (annotation.annotations == null) ? null

327

: new Annotation[aSize];

328

if (anots != null)

329

{

330

for (int a = 0; a < aSize; a++)

331

{

332

// process through codon map.

333

if (a < alignedCodons.length && alignedCodons[a] != null

334

&& alignedCodons[a].pos1 == (alignedCodons[a].pos3 - 2))

335

{

336

anots[a] = getCodonAnnotation(alignedCodons[a],

337

annotation.annotations);

}

}

}

AlignmentAnnotation aa = new AlignmentAnnotation(annotation.label,

343

annotation.description, anots);

344

aa.graph = annotation.graph;

345

aa.graphGroup = annotation.graphGroup;

346

aa.graphHeight = annotation.graphHeight;

347

if (annotation.getThreshold() != null)

348

{

349

aa.setThreshold(new GraphLine(annotation.getThreshold()));

350

}

351

if (annotation.hasScore)

352

{

353

aa.setScore(annotation.getScore());

354

}

355

356

final SequenceI seqRef = annotation.sequenceRef;

357

if (seqRef != null)

358

{

359

SequenceI aaSeq = acf.getAaForDnaSeq(seqRef);

360

if (aaSeq != null)

361

{

362

// aa.compactAnnotationArray(); // throw away alignment annotation

363

// positioning

364

aa.setSequenceRef(aaSeq);

365

// rebuild mapping

366

aa.createSequenceMapping(aaSeq, aaSeq.getStart(), true);

367

aa.adjustForAlignment();

368

aaSeq.addAlignmentAnnotation(aa);

369

}

370

}

371

al.addAnnotation(aa);

}

}

}

private static Annotation getCodonAnnotation(AlignedCodon is,

377

Annotation[] annotations)

378

{

379

// Have a look at all the codon positions for annotation and put the first

380

// one found into the translated annotation pos.

381

int contrib = 0;

382

Annotation annot = null;

383

for (int p = 1; p <= 3; p++)

384

{

385

int dnaCol = is.getBaseColumn(p);

386

if (annotations[dnaCol] != null)

{

if (annot == null)

{

annot = new Annotation(annotations[dnaCol]);

contrib = 1;

}

else

{

// merge with last

Annotation cpy = new Annotation(annotations[dnaCol]);

397

if (annot.colour == null)

398

{

399

annot.colour = cpy.colour;

400

}

401

if (annot.description == null || annot.description.length() == 0)

402

{

403

annot.description = cpy.description;

404

}

405

if (annot.displayCharacter == null)

406

{

407

annot.displayCharacter = cpy.displayCharacter;

408

}

409

if (annot.secondaryStructure == 0)

410

{

411

annot.secondaryStructure = cpy.secondaryStructure;

412

}

413

annot.value += cpy.value;

contrib++;

}

}

}

if (contrib > 1)

{

annot.value /= contrib;

}

return annot;

}

/**

* Translate a na sequence

427

428

* @param selection

429

* sequence displayed under viscontigs visible columns

430

* @param seqstring

431

* ORF read in some global alignment reference frame

432

* @param acf

433

* Definition of global ORF alignment reference frame

434

* @param proteinSeqs

435

* @param codeTable

436

* @return sequence ready to be added to alignment.

437

438

217

protected SequenceI translateCodingRegion(SequenceI selection,

439

String seqstring, AlignedCodonFrame acf,

440

List<SequenceI> proteinSeqs, GeneticCodeI codeTable)

441

{

442

217

List<int[]> skip = new ArrayList<>();

443

217

int[] skipint = null;

444

445

217

int npos = 0;

446

217

int vc = 0;

447

448

217

int[] scontigs = new int[startcontigs.length];

449

217

System.arraycopy(startcontigs, 0, scontigs, 0, startcontigs.length);

450

451

// allocate a roughly sized buffer for the protein sequence

452

217

StringBuilder protein = new StringBuilder(seqstring.length() / 2);

453

217

String seq = seqstring.replace('U', 'T').replace('u', 'T');

454

217

char codon[] = new char[3];

455

217

int cdp[] = new int[3];

456

217

int rf = 0;

457

217

int lastnpos = 0;

458

217

int nend;

459

217

int aspos = 0;

460

217

int resSize = 0;

461

6275

for (npos = 0, nend = seq.length(); npos < nend; npos++)

462

{

463

6058

if (!Comparison.isGap(seq.charAt(npos)))

464

{

465

6028

cdp[rf] = npos; // store position

466

6028

codon[rf++] = seq.charAt(npos); // store base

467

}

468

6058

if (rf == 3)

469

{

470

471

* Filled up a reading frame...

472

473

1888

AlignedCodon alignedCodon = new AlignedCodon(cdp[0], cdp[1],

474

cdp[2]);

475

1888

String aa = codeTable.translate(new String(codon));

476

1888

rf = 0;

477

1888

final String gapString = String.valueOf(gapChar);

478

1888

if (aa == null)

{

aa = gapString;

if (skipint == null)

{

skipint = new int[] { alignedCodon.pos1,

alignedCodon.pos3 /*

* cdp[0],

* cdp[2]

*/ };

}

skipint[1] = alignedCodon.pos3; // cdp[2];

}

else

{

1887

if (skipint != null)

494

{

495

// edit scontigs

496

skipint[0] = vismapping.shift(skipint[0]);

497

skipint[1] = vismapping.shift(skipint[1]);

498

for (vc = 0; vc < scontigs.length;)

499

{

500

if (scontigs[vc + 1] < skipint[0])

501

{

502

// before skipint starts

vc += 2;

continue;

}

if (scontigs[vc] > skipint[1])

507

{

508

// finished editing so

509

break;

510

}

511

// Edit the contig list to include the skipped region which did

512

// not translate

513

int[] t;

514

// from : s1 e1 s2 e2 s3 e3

515

// to s: s1 e1 s2 k0 k1 e2 s3 e3

516

// list increases by one unless one boundary (s2==k0 or e2==k1)

517

// matches, and decreases by one if skipint intersects whole

518

// visible contig

519

if (scontigs[vc] <= skipint[0])

520

{

521

if (skipint[0] == scontigs[vc])

522

{

523

// skipint at start of contig

524

// shift the start of this contig

525

if (scontigs[vc + 1] > skipint[1])

526

{

527

scontigs[vc] = skipint[1];

vc += 2;

}

else

{

if (scontigs[vc + 1] == skipint[1])

533

{

534

// remove the contig

535

t = new int[scontigs.length - 2];

536

if (vc > 0)

537

{

538

System.arraycopy(scontigs, 0, t, 0, vc - 1);

539

}

540

if (vc + 2 < t.length)

541

{

542

System.arraycopy(scontigs, vc + 2, t, vc,

t.length - vc + 2);

}

scontigs = t;

}

else

{

// truncate contig to before the skipint region

550

scontigs[vc + 1] = skipint[0] - 1;

vc += 2;

}

}

}

else

{

// scontig starts before start of skipint

558

if (scontigs[vc + 1] < skipint[1])

559

{

560

// skipint truncates end of scontig

561

scontigs[vc + 1] = skipint[0] - 1;

vc += 2;

}

else

{

// divide region to new contigs

567

t = new int[scontigs.length + 2];

568

System.arraycopy(scontigs, 0, t, 0, vc + 1);

569

t[vc + 1] = skipint[0];

570

t[vc + 2] = skipint[1];

571

System.arraycopy(scontigs, vc + 1, t, vc + 3,

572

scontigs.length - (vc + 1));

scontigs = t;

vc += 4;

}

}

}

}

skip.add(skipint);

skipint = null;

}

1887

if (aa.equals(ResidueProperties.STOP))

{

aa = STOP_ASTERIX;

}

1887

resSize++;

587

}

588

1888

boolean findpos = true;

589

5150

while (findpos)

590

{

591

592

* Compare this codon's base positions with those currently aligned to

593

* this column in the translation.

594

595

3262

final int compareCodonPos = compareCodonPos(alignedCodon,

596

alignedCodons[aspos]);

597

3262

switch (compareCodonPos)

598

{

599

178

case -1:

600

601

602

* This codon should precede the mapped positions - need to insert a

603

* gap in all prior sequences.

604

605

178

insertAAGap(aspos, proteinSeqs);

606

178

findpos = false;

607

178

break;

608

609

1374

case +1:

610

611

612

* This codon belongs after the aligned codons at aspos. Prefix it

613

* with a gap and try the next position.

614

615

1374

aa = gapString + aa;

616

1374

aspos++;

617

1374

break;

618

619

1710

case 0:

620

621

622

* Exact match - codon 'belongs' at this translated position.

623

624

1710

findpos = false;

625

}

626

}

627

1888

protein.append(aa);

628

1888

lastnpos = npos;

629

1888

if (alignedCodons[aspos] == null)

630

{

631

// mark this column as aligning to this aligned reading frame

632

466

alignedCodons[aspos] = alignedCodon;

633

}

634

1422

else if (!alignedCodons[aspos].equals(alignedCodon))

635

{

636

throw new IllegalStateException(

637

"Tried to coalign " + alignedCodons[aspos].toString()

638

+ " with " + alignedCodon.toString());

639

}

640

1888

if (aspos >= aaWidth)

641

{

642

// update maximum alignment width

643

449

aaWidth = aspos;

644

}

645

// ready for next translated reading frame alignment position (if any)

646

1888

aspos++;

647

}

648

}

649

217

if (resSize > 0)

650

{

651

217

SequenceI newseq = new Sequence(selection.getName(),

652

protein.toString());

653

217

if (rf != 0)

654

{

655

188

final String errMsg = "trimming contigs for incomplete terminal codon.";

656

188

jalview.bin.Console.errPrintln(errMsg);

657

// map and trim contigs to ORF region

658

188

vc = scontigs.length - 1;

659

188

lastnpos = vismapping.shift(lastnpos); // place npos in context of

660

// whole dna alignment (rather

661

// than visible contigs)

662

// incomplete ORF could be broken over one or two visible contig

663

// intervals.

664

376

while (vc >= 0 && scontigs[vc] > lastnpos)

665

{

666

188

if (vc > 0 && scontigs[vc - 1] > lastnpos)

{

vc -= 2;

}

else

{

// correct last interval in list.

673

188

scontigs[vc] = lastnpos;

}

}

188

if (vc > 0 && (vc + 1) < scontigs.length)

678

{

679

// truncate map list to just vc elements

680

int t[] = new int[vc + 1];

681

System.arraycopy(scontigs, 0, t, 0, vc + 1);

682

scontigs = t;

683

}

684

188

if (vc <= 0)

{

scontigs = null;

}

}

217

if (scontigs != null)

690

{

691

217

npos = 0;

692

// map scontigs to actual sequence positions on selection

693

412

for (vc = 0; vc < scontigs.length; vc += 2)

694

{

695

220

scontigs[vc] = selection.findPosition(scontigs[vc]); // not from 1!

696

220

scontigs[vc + 1] = selection.findPosition(scontigs[vc + 1]); // exclusive

697

220

if (scontigs[vc + 1] == selection.getEnd())

{

break;

}

}

// trim trailing empty intervals.

703

217

if ((vc + 2) < scontigs.length)

704

{

705

int t[] = new int[vc + 2];

706

System.arraycopy(scontigs, 0, t, 0, vc + 2);

scontigs = t;

}

* delete intervals in scontigs which are not translated. 1. map skip

711

* into sequence position intervals 2. truncate existing ranges and add

712

* new ranges to exclude untranslated regions. if (skip.size()>0) {

713

* Vector narange = new Vector(); for (vc=0; vc<scontigs.length; vc++) {

714

* narange.addElement(new int[] {scontigs[vc]}); } int sint=0,iv[]; vc =

715

* 0; while (sint<skip.size()) { skipint = (int[]) skip.elementAt(sint);

716

* do { iv = (int[]) narange.elementAt(vc); if (iv[0]>=skipint[0] &&

717

* iv[0]<=skipint[1]) { if (iv[0]==skipint[0]) { // delete beginning of

718

* range } else { // truncate range and create new one if necessary iv =

719

* (int[]) narange.elementAt(vc+1); if (iv[0]<=skipint[1]) { // truncate

720

* range iv[0] = skipint[1]; } else { } } } else if (iv[0]<skipint[0]) {

721

* iv = (int[]) narange.elementAt(vc+1); } } while (iv[0]) } }

722

723

217

MapList map = new MapList(scontigs, new int[] { 1, resSize }, 3, 1);

724

725

217

transferCodedFeatures(selection, newseq, map);

726

727

728

* Construct a dataset sequence for our new peptide.

729

730

217

SequenceI rseq = newseq.deriveSequence();

731

732

733

* Store a mapping (between the dataset sequences for the two

734

* sequences).

735

736

// SIDE-EFFECT: acf stores the aligned sequence reseq; to remove!

737

217

acf.addMap(selection, rseq, map);

738

217

return rseq;

739

}

740

}

741

// register the mapping somehow

return null;

}

/**

* Insert a gap into the aligned proteins and the codon mapping array.

* @param pos

* @param proteinSeqs

* @return

178

protected void insertAAGap(int pos, List<SequenceI> proteinSeqs)

754

{

755

178

aaWidth++;

756

178

for (SequenceI seq : proteinSeqs)

757

{

758

598

seq.insertCharAt(pos, gapChar);

759

}

760

761

178

checkCodonFrameWidth();

762

178

if (pos < aaWidth)

763

{

764

178

aaWidth++;

765

766

767

* Shift from [pos] to the end one to the right, and null out [pos]

768

769

178

System.arraycopy(alignedCodons, pos, alignedCodons, pos + 1,

770

alignedCodons.length - pos - 1);

771

178

alignedCodons[pos] = null;

}

}

/**

* Check the codons array can accommodate a single insertion, if not resize

777

* it.

778

779

178

protected void checkCodonFrameWidth()

780

{

781

178

if (alignedCodons[alignedCodons.length - 1] != null)

782

{

783

784

* arraycopy insertion would bump a filled slot off the end, so expand.

785

786

AlignedCodon[] c = new AlignedCodon[alignedCodons.length + 10];

787

System.arraycopy(alignedCodons, 0, c, 0, alignedCodons.length);

alignedCodons = c;

}

}

/**

* Given a peptide newly translated from a dna sequence, copy over and set any

794

* features on the peptide from the DNA.

* @param dna

* @param pep

* @param map

217

private static void transferCodedFeatures(SequenceI dna, SequenceI pep,

801

MapList map)

802

{

803

// BH 2019.01.25 nop?

804

// List<DBRefEntry> dnarefs = DBRefUtils.selectRefs(dna.getDBRefs(),

805

// DBRefSource.DNACODINGDBS);

806

// if (dnarefs != null)

807

// {

808

// // intersect with pep

809

// for (int d = 0, nd = dnarefs.size(); d < nd; d++)

810

// {

811

// Mapping mp = dnarefs.get(d).getMap();

// if (mp != null)

// {

// }

// }

// }

217

for (SequenceFeature sf : dna.getFeatures().getAllFeatures())

818

{

819

if (FeatureProperties.isCodingFeature(null, sf.getType()))

820

{

821

// if (map.intersectsFrom(sf[f].begin, sf[f].end))

{

}

}

}

}

/**

* Returns an alignment consisting of the reversed (and optionally

831

* complemented) sequences set in this object's constructor

* @param complement

* @return

public AlignmentI reverseCdna(boolean complement)

837

{

838

int sSize = selection.size();

839

List<SequenceI> reversed = new ArrayList<>();

840

for (int s = 0; s < sSize; s++)

841

{

842

SequenceI newseq = reverseSequence(selection.get(s).getName(),

843

seqstring[s], complement);

if (newseq != null)

{

reversed.add(newseq);

}

}

SequenceI[] newseqs = reversed.toArray(new SequenceI[reversed.size()]);

852

AlignmentI al = new Alignment(newseqs);

853

((Alignment) al).createDatasetAlignment();

return al;

}

/**

* Returns a reversed, and optionally complemented, sequence. The new

859

* sequence's name is the original name with "|rev" or "|revcomp" appended.

860

* aAcCgGtT and DNA ambiguity codes are complemented, any other characters are

* left unchanged.

* @param seq

* @param complement

* @return

public static SequenceI reverseSequence(String seqName, String sequence,

868

boolean complement)

869

{

870

String newName = seqName + "|rev" + (complement ? "comp" : "");

871

char[] originalSequence = sequence.toCharArray();

872

int length = originalSequence.length;

873

char[] reversedSequence = new char[length];

874

int bases = 0;

875

for (int i = 0; i < length; i++)

876

{

877

char c = complement ? getComplement(originalSequence[i])

878

: originalSequence[i];

879

reversedSequence[length - i - 1] = c;

880

if (!Comparison.isGap(c))

{

bases++;

}

}

SequenceI reversed = new Sequence(newName, reversedSequence, 1, bases);

return reversed;

}

/**

* Answers the reverse complement of the input string

891

892

* @see #getComplement(char)

* @param s

* @return

public static String reverseComplement(String s)

897

{

898

StringBuilder sb = new StringBuilder(s.length());

899

for (int i = s.length() - 1; i >= 0; i--)

900

{

901

sb.append(Dna.getComplement(s.charAt(i)));

902

}

903

return sb.toString();

}

/**

* Returns dna complement (preserving case) for aAcCgGtTuU. Ambiguity codes

908

* are treated as on http://reverse-complement.com/. Anything else is left

* unchanged.

* @param c

* @return

public static char getComplement(char c)

{

char result = c;

switch (c)

{

case '-':

case '.':

case ' ':

break;

case 'a':

result = 't';

break;

case 'A':

result = 'T';

break;

case 'c':

result = 'g';

break;

case 'C':

result = 'G';

break;

case 'g':

result = 'c';

break;

case 'G':

result = 'C';

break;

case 't':

result = 'a';

break;

case 'T':

result = 'A';

break;

case 'u':

result = 'a';

break;

case 'U':

result = 'A';

break;

case 'r':

result = 'y';

break;

case 'R':

result = 'Y';

break;

case 'y':

result = 'r';

break;

case 'Y':

result = 'R';

break;

case 'k':

result = 'm';

break;

case 'K':

result = 'M';

break;

case 'm':

result = 'k';

break;

case 'M':

result = 'K';

break;

case 'b':

result = 'v';

break;

case 'B':

result = 'V';

break;

case 'v':

result = 'b';

break;

case 'V':

result = 'B';

break;

case 'd':

result = 'h';

break;

case 'D':

result = 'H';

break;

case 'h':

result = 'd';

break;

case 'H':

result = 'D';

break;

}

return result;

}

}

Coverage Report

File Dna.java

Coverage histogram

Code metrics

Classes

Class Dna

Contributing tests

Contributing tests

Source view