1 |
|
|
2 |
|
|
3 |
|
|
4 |
|
|
5 |
|
|
6 |
|
|
7 |
|
|
8 |
|
|
9 |
|
|
10 |
|
|
11 |
|
|
12 |
|
|
13 |
|
|
14 |
|
|
15 |
|
|
16 |
|
|
17 |
|
|
18 |
|
|
19 |
|
|
20 |
|
|
21 |
|
package jalview.analysis; |
22 |
|
|
23 |
|
import jalview.api.analysis.ScoreModelI; |
24 |
|
import jalview.api.analysis.SimilarityParamsI; |
25 |
|
import jalview.datamodel.AlignmentView; |
26 |
|
import jalview.datamodel.CigarArray; |
27 |
|
import jalview.datamodel.SeqCigar; |
28 |
|
import jalview.datamodel.SequenceI; |
29 |
|
import jalview.datamodel.SequenceNode; |
30 |
|
import jalview.math.MatrixI; |
31 |
|
import jalview.viewmodel.AlignmentViewport; |
32 |
|
|
33 |
|
import java.util.BitSet; |
34 |
|
import java.util.Vector; |
35 |
|
|
|
|
| 0% |
Uncovered Elements: 168 (168) |
Complexity: 40 |
Complexity Density: 0.35 |
|
36 |
|
public abstract class TreeBuilder |
37 |
|
{ |
38 |
|
public static final String AVERAGE_DISTANCE = "AV"; |
39 |
|
|
40 |
|
public static final String NEIGHBOUR_JOINING = "NJ"; |
41 |
|
|
42 |
|
protected Vector<BitSet> clusters; |
43 |
|
|
44 |
|
protected SequenceI[] sequences; |
45 |
|
|
46 |
|
public AlignmentView seqData; |
47 |
|
|
48 |
|
protected BitSet done; |
49 |
|
|
50 |
|
protected int noseqs; |
51 |
|
|
52 |
|
int noClus; |
53 |
|
|
54 |
|
protected MatrixI distances; |
55 |
|
|
56 |
|
protected int mini; |
57 |
|
|
58 |
|
protected int minj; |
59 |
|
|
60 |
|
protected double ri; |
61 |
|
|
62 |
|
protected double rj; |
63 |
|
|
64 |
|
SequenceNode maxdist; |
65 |
|
|
66 |
|
SequenceNode top; |
67 |
|
|
68 |
|
double maxDistValue; |
69 |
|
|
70 |
|
double maxheight; |
71 |
|
|
72 |
|
int ycount; |
73 |
|
|
74 |
|
Vector<SequenceNode> node; |
75 |
|
|
76 |
|
private AlignmentView seqStrings; |
77 |
|
|
78 |
|
|
79 |
|
|
80 |
|
|
81 |
|
@param |
82 |
|
@param |
83 |
|
@param |
84 |
|
|
|
|
| 0% |
Uncovered Elements: 14 (14) |
Complexity: 2 |
Complexity Density: 0.17 |
|
85 |
0 |
public TreeBuilder(AlignmentViewport av, ScoreModelI sm,... |
86 |
|
SimilarityParamsI scoreParameters) |
87 |
|
{ |
88 |
0 |
int start, end; |
89 |
0 |
boolean selview = av.getSelectionGroup() != null |
90 |
|
&& av.getSelectionGroup().getSize() > 1; |
91 |
0 |
seqStrings = av.getAlignmentView(selview); |
92 |
0 |
if (!selview) |
93 |
|
{ |
94 |
0 |
start = 0; |
95 |
0 |
end = av.getAlignment().getWidth(); |
96 |
0 |
this.sequences = av.getAlignment().getSequencesArray(); |
97 |
|
} |
98 |
|
else |
99 |
|
{ |
100 |
0 |
start = av.getSelectionGroup().getStartRes(); |
101 |
0 |
end = av.getSelectionGroup().getEndRes() + 1; |
102 |
0 |
this.sequences = av.getSelectionGroup() |
103 |
|
.getSequencesInOrder(av.getAlignment()); |
104 |
|
} |
105 |
|
|
106 |
0 |
init(seqStrings, start, end); |
107 |
|
|
108 |
0 |
computeTree(sm, scoreParameters); |
109 |
|
} |
110 |
|
|
|
|
| 0% |
Uncovered Elements: 1 (1) |
Complexity: 1 |
Complexity Density: 1 |
|
111 |
0 |
public SequenceI[] getSequences()... |
112 |
|
{ |
113 |
0 |
return sequences; |
114 |
|
} |
115 |
|
|
116 |
|
|
117 |
|
|
118 |
|
|
119 |
|
@param |
120 |
|
|
121 |
|
|
122 |
|
@return |
123 |
|
|
|
|
| 0% |
Uncovered Elements: 22 (22) |
Complexity: 6 |
Complexity Density: 0.43 |
|
124 |
0 |
double findHeight(SequenceNode nd)... |
125 |
|
{ |
126 |
0 |
if (nd == null) |
127 |
|
{ |
128 |
0 |
return maxheight; |
129 |
|
} |
130 |
|
|
131 |
0 |
if ((nd.left() == null) && (nd.right() == null)) |
132 |
|
{ |
133 |
0 |
nd.height = ((SequenceNode) nd.parent()).height + nd.dist; |
134 |
|
|
135 |
0 |
if (nd.height > maxheight) |
136 |
|
{ |
137 |
0 |
return nd.height; |
138 |
|
} |
139 |
|
else |
140 |
|
{ |
141 |
0 |
return maxheight; |
142 |
|
} |
143 |
|
} |
144 |
|
else |
145 |
|
{ |
146 |
0 |
if (nd.parent() != null) |
147 |
|
{ |
148 |
0 |
nd.height = ((SequenceNode) nd.parent()).height + nd.dist; |
149 |
|
} |
150 |
|
else |
151 |
|
{ |
152 |
0 |
maxheight = 0; |
153 |
0 |
nd.height = (float) 0.0; |
154 |
|
} |
155 |
|
|
156 |
0 |
maxheight = findHeight((SequenceNode) (nd.left())); |
157 |
0 |
maxheight = findHeight((SequenceNode) (nd.right())); |
158 |
|
} |
159 |
|
|
160 |
0 |
return maxheight; |
161 |
|
} |
162 |
|
|
163 |
|
|
164 |
|
|
165 |
|
|
166 |
|
@param |
167 |
|
|
168 |
|
|
|
|
| 0% |
Uncovered Elements: 2 (2) |
Complexity: 1 |
Complexity Density: 0.5 |
|
169 |
0 |
void reCount(SequenceNode nd)... |
170 |
|
{ |
171 |
0 |
ycount = 0; |
172 |
|
|
173 |
|
|
174 |
0 |
_reCount(nd); |
175 |
|
} |
176 |
|
|
177 |
|
|
178 |
|
|
179 |
|
|
180 |
|
@param |
181 |
|
|
182 |
|
|
|
|
| 0% |
Uncovered Elements: 15 (15) |
Complexity: 4 |
Complexity Density: 0.36 |
|
183 |
0 |
void _reCount(SequenceNode nd)... |
184 |
|
{ |
185 |
|
|
186 |
|
|
187 |
|
|
188 |
|
|
189 |
|
|
190 |
0 |
if (nd == null) |
191 |
|
{ |
192 |
0 |
return; |
193 |
|
} |
194 |
|
|
195 |
|
|
196 |
0 |
if ((nd.left() != null) && (nd.right() != null)) |
197 |
|
{ |
198 |
|
|
199 |
0 |
_reCount((SequenceNode) nd.left()); |
200 |
0 |
_reCount((SequenceNode) nd.right()); |
201 |
|
|
202 |
0 |
SequenceNode l = (SequenceNode) nd.left(); |
203 |
0 |
SequenceNode r = (SequenceNode) nd.right(); |
204 |
|
|
205 |
0 |
nd.count = l.count + r.count; |
206 |
0 |
nd.ycount = (l.ycount + r.ycount) / 2; |
207 |
|
} |
208 |
|
else |
209 |
|
{ |
210 |
0 |
nd.count = 1; |
211 |
0 |
nd.ycount = ycount++; |
212 |
|
} |
213 |
|
|
214 |
|
} |
215 |
|
|
216 |
|
|
217 |
|
|
218 |
|
|
219 |
|
@return |
220 |
|
|
|
|
| 0% |
Uncovered Elements: 1 (1) |
Complexity: 1 |
Complexity Density: 1 |
|
221 |
0 |
public SequenceNode getTopNode()... |
222 |
|
{ |
223 |
0 |
return top; |
224 |
|
} |
225 |
|
|
226 |
|
|
227 |
|
|
228 |
|
@return |
229 |
|
|
|
|
| 0% |
Uncovered Elements: 1 (1) |
Complexity: 1 |
Complexity Density: 1 |
|
230 |
0 |
public boolean hasDistances()... |
231 |
|
{ |
232 |
0 |
return true; |
233 |
|
} |
234 |
|
|
235 |
|
|
236 |
|
|
237 |
|
@return |
238 |
|
|
|
|
| 0% |
Uncovered Elements: 1 (1) |
Complexity: 1 |
Complexity Density: 1 |
|
239 |
0 |
public boolean hasBootstrap()... |
240 |
|
{ |
241 |
0 |
return false; |
242 |
|
} |
243 |
|
|
|
|
| 0% |
Uncovered Elements: 1 (1) |
Complexity: 1 |
Complexity Density: 1 |
|
244 |
0 |
public boolean hasRootDistance()... |
245 |
|
{ |
246 |
0 |
return true; |
247 |
|
} |
248 |
|
|
249 |
|
|
250 |
|
|
251 |
|
|
252 |
|
|
|
|
| 0% |
Uncovered Elements: 13 (13) |
Complexity: 2 |
Complexity Density: 0.18 |
|
253 |
0 |
void cluster()... |
254 |
|
{ |
255 |
0 |
while (noClus > 2) |
256 |
|
{ |
257 |
0 |
findMinDistance(); |
258 |
|
|
259 |
0 |
joinClusters(mini, minj); |
260 |
|
|
261 |
0 |
noClus--; |
262 |
|
} |
263 |
|
|
264 |
0 |
int rightChild = done.nextClearBit(0); |
265 |
0 |
int leftChild = done.nextClearBit(rightChild + 1); |
266 |
|
|
267 |
0 |
joinClusters(leftChild, rightChild); |
268 |
0 |
top = (node.elementAt(leftChild)); |
269 |
|
|
270 |
0 |
reCount(top); |
271 |
0 |
findHeight(top); |
272 |
0 |
findMaxDist(top); |
273 |
|
} |
274 |
|
|
275 |
|
|
276 |
|
|
277 |
|
|
278 |
|
|
279 |
|
@return |
280 |
|
|
281 |
|
protected abstract double findMinDistance(); |
282 |
|
|
283 |
|
|
284 |
|
|
285 |
|
|
286 |
|
|
287 |
|
|
288 |
|
|
289 |
|
|
290 |
|
|
291 |
|
|
292 |
|
|
293 |
|
@param |
294 |
|
@param |
295 |
|
|
|
|
| 0% |
Uncovered Elements: 4 (4) |
Complexity: 1 |
Complexity Density: 0.25 |
|
296 |
0 |
protected void computeTree(ScoreModelI sm, SimilarityParamsI scoreOptions)... |
297 |
|
{ |
298 |
0 |
distances = sm.findDistances(seqData, scoreOptions); |
299 |
|
|
300 |
0 |
makeLeaves(); |
301 |
|
|
302 |
0 |
noClus = clusters.size(); |
303 |
|
|
304 |
0 |
cluster(); |
305 |
|
} |
306 |
|
|
307 |
|
|
308 |
|
|
309 |
|
|
310 |
|
|
311 |
|
@param |
312 |
|
|
|
|
| 0% |
Uncovered Elements: 15 (15) |
Complexity: 5 |
Complexity Density: 0.56 |
|
313 |
0 |
void findMaxDist(SequenceNode nd)... |
314 |
|
{ |
315 |
0 |
if (nd == null) |
316 |
|
{ |
317 |
0 |
return; |
318 |
|
} |
319 |
|
|
320 |
0 |
if ((nd.left() == null) && (nd.right() == null)) |
321 |
|
{ |
322 |
0 |
double dist = nd.dist; |
323 |
|
|
324 |
0 |
if (dist > maxDistValue) |
325 |
|
{ |
326 |
0 |
maxdist = nd; |
327 |
0 |
maxDistValue = dist; |
328 |
|
} |
329 |
|
} |
330 |
|
else |
331 |
|
{ |
332 |
0 |
findMaxDist((SequenceNode) nd.left()); |
333 |
0 |
findMaxDist((SequenceNode) nd.right()); |
334 |
|
} |
335 |
|
} |
336 |
|
|
337 |
|
|
338 |
|
|
339 |
|
|
340 |
|
@param |
341 |
|
@param |
342 |
|
|
343 |
|
@return |
344 |
|
|
|
|
| 0% |
Uncovered Elements: 13 (13) |
Complexity: 6 |
Complexity Density: 0.86 |
|
345 |
0 |
protected double findr(int i, int j)... |
346 |
|
{ |
347 |
0 |
double tmp = 1; |
348 |
|
|
349 |
0 |
for (int k = 0; k < noseqs; k++) |
350 |
|
{ |
351 |
0 |
if ((k != i) && (k != j) && (!done.get(k))) |
352 |
|
{ |
353 |
0 |
tmp = tmp + distances.getValue(i, k); |
354 |
|
} |
355 |
|
} |
356 |
|
|
357 |
0 |
if (noClus > 2) |
358 |
|
{ |
359 |
0 |
tmp = tmp / (noClus - 2); |
360 |
|
} |
361 |
|
|
362 |
0 |
return tmp; |
363 |
|
} |
364 |
|
|
|
|
| 0% |
Uncovered Elements: 20 (20) |
Complexity: 4 |
Complexity Density: 0.29 |
|
365 |
0 |
protected void init(AlignmentView seqView, int start, int end)... |
366 |
|
{ |
367 |
0 |
this.node = new Vector<SequenceNode>(); |
368 |
0 |
if (seqView != null) |
369 |
|
{ |
370 |
0 |
this.seqData = seqView; |
371 |
|
} |
372 |
|
else |
373 |
|
{ |
374 |
0 |
SeqCigar[] seqs = new SeqCigar[sequences.length]; |
375 |
0 |
for (int i = 0; i < sequences.length; i++) |
376 |
|
{ |
377 |
0 |
seqs[i] = new SeqCigar(sequences[i], start, end); |
378 |
|
} |
379 |
0 |
CigarArray sdata = new CigarArray(seqs); |
380 |
0 |
sdata.addOperation(CigarArray.M, end - start + 1); |
381 |
0 |
this.seqData = new AlignmentView(sdata, start); |
382 |
|
} |
383 |
|
|
384 |
|
|
385 |
|
|
386 |
|
|
387 |
0 |
noseqs = 0; |
388 |
|
|
389 |
0 |
done = new BitSet(); |
390 |
|
|
391 |
0 |
for (SequenceI seq : sequences) |
392 |
|
{ |
393 |
0 |
if (seq != null) |
394 |
|
{ |
395 |
0 |
noseqs++; |
396 |
|
} |
397 |
|
} |
398 |
|
} |
399 |
|
|
400 |
|
|
401 |
|
|
402 |
|
|
403 |
|
@param |
404 |
|
@param |
405 |
|
|
|
|
| 0% |
Uncovered Elements: 16 (16) |
Complexity: 1 |
Complexity Density: 0.06 |
|
406 |
0 |
void joinClusters(final int i, final int j)... |
407 |
|
{ |
408 |
0 |
double dist = distances.getValue(i, j); |
409 |
|
|
410 |
0 |
ri = findr(i, j); |
411 |
0 |
rj = findr(j, i); |
412 |
|
|
413 |
0 |
findClusterDistance(i, j); |
414 |
|
|
415 |
0 |
SequenceNode sn = new SequenceNode(); |
416 |
|
|
417 |
0 |
sn.setLeft((node.elementAt(i))); |
418 |
0 |
sn.setRight((node.elementAt(j))); |
419 |
|
|
420 |
0 |
SequenceNode tmpi = (node.elementAt(i)); |
421 |
0 |
SequenceNode tmpj = (node.elementAt(j)); |
422 |
|
|
423 |
0 |
findNewDistances(tmpi, tmpj, dist); |
424 |
|
|
425 |
0 |
tmpi.setParent(sn); |
426 |
0 |
tmpj.setParent(sn); |
427 |
|
|
428 |
0 |
node.setElementAt(sn, i); |
429 |
|
|
430 |
|
|
431 |
|
|
432 |
|
|
433 |
|
|
434 |
0 |
clusters.get(i).or(clusters.get(j)); |
435 |
0 |
clusters.get(j).clear(); |
436 |
0 |
done.set(j); |
437 |
|
} |
438 |
|
|
439 |
|
|
440 |
|
|
441 |
|
|
442 |
|
|
443 |
|
protected abstract void findNewDistances(SequenceNode nodei, |
444 |
|
SequenceNode nodej, double previousDistance); |
445 |
|
|
446 |
|
|
447 |
|
|
448 |
|
|
449 |
|
|
450 |
|
|
451 |
|
@param |
452 |
|
@param |
453 |
|
|
454 |
|
protected abstract void findClusterDistance(int i, int j); |
455 |
|
|
456 |
|
|
457 |
|
|
458 |
|
|
|
|
| 0% |
Uncovered Elements: 11 (11) |
Complexity: 2 |
Complexity Density: 0.22 |
|
459 |
0 |
void makeLeaves()... |
460 |
|
{ |
461 |
0 |
clusters = new Vector<BitSet>(); |
462 |
|
|
463 |
0 |
for (int i = 0; i < noseqs; i++) |
464 |
|
{ |
465 |
0 |
SequenceNode sn = new SequenceNode(); |
466 |
|
|
467 |
0 |
sn.setElement(sequences[i]); |
468 |
0 |
sn.setName(sequences[i].getName()); |
469 |
0 |
node.addElement(sn); |
470 |
0 |
BitSet bs = new BitSet(); |
471 |
0 |
bs.set(i); |
472 |
0 |
clusters.addElement(bs); |
473 |
|
} |
474 |
|
} |
475 |
|
|
|
|
| 0% |
Uncovered Elements: 1 (1) |
Complexity: 1 |
Complexity Density: 1 |
|
476 |
0 |
public AlignmentView getOriginalData()... |
477 |
|
{ |
478 |
0 |
return seqStrings; |
479 |
|
} |
480 |
|
|
481 |
|
} |