1 package jalview.io.vamsas;
\r
3 import java.io.IOException;
\r
4 import java.util.Enumeration;
\r
5 import java.util.Hashtable;
\r
6 import java.util.Vector;
\r
8 import jalview.analysis.NJTree;
\r
9 import jalview.analysis.SequenceIdMatcher;
\r
10 import jalview.bin.Cache;
\r
11 import jalview.datamodel.AlignmentI;
\r
12 import jalview.datamodel.AlignmentView;
\r
13 import jalview.datamodel.BinaryNode;
\r
14 import jalview.datamodel.SeqCigar;
\r
15 import jalview.datamodel.Sequence;
\r
16 import jalview.datamodel.SequenceI;
\r
17 import jalview.datamodel.SequenceNode;
\r
18 import jalview.gui.AlignFrame;
\r
19 import jalview.gui.AlignViewport;
\r
20 import jalview.gui.TreePanel;
\r
21 import jalview.io.NewickFile;
\r
22 import jalview.io.VamsasAppDatastore;
\r
23 import uk.ac.vamsas.client.Vobject;
\r
24 import uk.ac.vamsas.objects.core.AlignmentSequence;
\r
25 import uk.ac.vamsas.objects.core.Entry;
\r
26 import uk.ac.vamsas.objects.core.Input;
\r
27 import uk.ac.vamsas.objects.core.Newick;
\r
28 import uk.ac.vamsas.objects.core.Param;
\r
29 import uk.ac.vamsas.objects.core.Provenance;
\r
30 import uk.ac.vamsas.objects.core.Seg;
\r
31 import uk.ac.vamsas.objects.core.Treenode;
\r
32 import uk.ac.vamsas.objects.core.Vref;
\r
34 public class Tree extends DatastoreItem
\r
40 uk.ac.vamsas.objects.core.Tree tree;
\r
42 uk.ac.vamsas.objects.core.Alignment alignment; // may be null => dataset or
\r
44 // other kind of tree
\r
45 private NewickFile ntree;
\r
47 private String title;
\r
49 private AlignmentView inputData = null;
\r
51 public static void updateFrom(VamsasAppDatastore datastore,
\r
52 jalview.gui.AlignFrame alignFrame,
\r
53 uk.ac.vamsas.objects.core.Tree vtree)
\r
55 Tree toTree = new Tree(datastore, alignFrame, vtree);
\r
59 public Tree(VamsasAppDatastore datastore,
\r
60 jalview.gui.AlignFrame alignFrame,
\r
61 uk.ac.vamsas.objects.core.Tree vtree)
\r
65 TreePanel tp = (TreePanel) getvObj2jv(tree);
\r
68 if (tree.isUpdated())
\r
71 .info("Update from vamsas document to alignment associated tree not implemented yet.");
\r
77 Object[] idata = recoverInputData(tree.getProvenance());
\r
80 if (idata != null && idata[0] != null)
\r
82 inputData = (AlignmentView) idata[0];
\r
85 title = tree.getNewick(0).getTitle();
\r
86 if (title == null || title.length() == 0)
\r
88 title = tree.getTitle(); // hack!!!!
\r
90 } catch (Exception e)
\r
92 Cache.log.warn("Problems parsing treefile '"
\r
93 + tree.getNewick(0).getContent() + "'", e);
\r
98 private NewickFile getNtree() throws IOException
\r
100 return new jalview.io.NewickFile(tree.getNewick(0).getContent());
\r
103 public Tree(VamsasAppDatastore datastore, TreePanel tp2, AlignmentI jal2,
\r
104 uk.ac.vamsas.objects.core.Alignment alignment2)
\r
110 alignment = alignment2;
\r
112 tree = (uk.ac.vamsas.objects.core.Tree) getjv2vObj(tp);
\r
119 if (isModifiable(tree.getModifiable()))
\r
121 // synchronize(); // update();
\r
122 // verify any changes.
\r
123 System.out.println("Update tree in document.");
\r
128 System.out.println("Add modified tree as new tree in document.");
\r
134 * correctly creates provenance for trees calculated on an alignment by
\r
141 private Provenance makeTreeProvenance(AlignmentI jal, TreePanel tp)
\r
143 Cache.log.debug("Making Tree provenance for " + tp.getTitle());
\r
144 Provenance prov = new Provenance();
\r
145 prov.addEntry(new Entry());
\r
146 prov.getEntry(0).setAction("imported " + tp.getTitle());
\r
147 prov.getEntry(0).setUser(provEntry.getUser());
\r
148 prov.getEntry(0).setApp(provEntry.getApp());
\r
149 prov.getEntry(0).setDate(provEntry.getDate());
\r
150 if (tp.getTree().hasOriginalSequenceData())
\r
152 Input vInput = new Input();
\r
153 // LATER: check to see if tree input data is contained in this alignment -
\r
154 // or just correctly resolve the tree's seqData to the correct alignment
\r
157 Vector alsqrefs = getjv2vObjs(findAlignmentSequences(jal, tp
\r
158 .getTree().seqData.getSequences()));
\r
159 Object[] alsqs = new Object[alsqrefs.size()];
\r
160 alsqrefs.copyInto(alsqs);
\r
161 vInput.setObjRef(alsqs);
\r
162 // now create main provenance data
\r
163 prov.getEntry(0).setAction("created " + tp.getTitle());
\r
164 prov.getEntry(0).addInput(vInput);
\r
165 // jalview's special input parameter for distance matrix calculations
\r
166 vInput.setName("jalview:seqdist"); // TODO: settle on appropriate name.
\r
167 prov.getEntry(0).addParam(new Param());
\r
168 prov.getEntry(0).getParam(0).setName("treeType");
\r
169 prov.getEntry(0).getParam(0).setType("utf8");
\r
170 prov.getEntry(0).getParam(0).setContent("NJ"); // TODO: type of tree is a
\r
171 // general parameter
\r
172 int ranges[] = tp.getTree().seqData.getVisibleContigs();
\r
173 // VisibleContigs are with respect to alignment coordinates. Still need
\r
175 int start = tp.getTree().seqData.getAlignmentOrigin();
\r
176 for (int r = 0; r < ranges.length; r += 2)
\r
178 Seg visSeg = new Seg();
\r
179 visSeg.setStart(1 + start + ranges[r]);
\r
180 visSeg.setEnd(start + ranges[r + 1]);
\r
181 visSeg.setInclusive(true);
\r
182 vInput.addSeg(visSeg);
\r
185 Cache.log.debug("Finished Tree provenance for " + tp.getTitle());
\r
190 * look up SeqCigars in an existing alignment.
\r
194 * @return vector of alignment sequences in order of SeqCigar array (but
\r
195 * missing unfound seqcigars)
\r
197 private Vector findAlignmentSequences(AlignmentI jal, SeqCigar[] sequences)
\r
199 SeqCigar[] tseqs = new SeqCigar[sequences.length];
\r
200 System.arraycopy(sequences, 0, tseqs, 0, sequences.length);
\r
201 Vector alsq = new Vector();
\r
202 Enumeration as = jal.getSequences().elements();
\r
203 while (as.hasMoreElements())
\r
205 SequenceI asq = (SequenceI) as.nextElement();
\r
206 for (int t = 0; t < sequences.length; t++)
\r
208 if (tseqs[t] != null
\r
209 && (tseqs[t].getRefSeq() == asq || tseqs[t].getRefSeq() == asq
\r
210 .getDatasetSequence()))
\r
211 // && tseqs[t].getStart()>=asq.getStart() &&
\r
212 // tseqs[t].getEnd()<=asq.getEnd())
\r
219 if (alsq.size() < sequences.length)
\r
221 .warn("Not recovered all alignment sequences for given set of input sequence CIGARS");
\r
227 * Update jalview newick representation with TreeNode map
\r
230 * the treepanel that this tree is bound to.
\r
232 public void UpdateSequenceTreeMap(TreePanel tp)
\r
234 if (tp == null || tree != null)
\r
236 Vector leaves = new Vector();
\r
237 tp.getTree().findLeaves(tp.getTree().getTopNode(), leaves);
\r
238 Treenode[] tn = tree.getTreenode(); // todo: select nodes for this
\r
240 int sz = tn.length;
\r
245 Treenode node = tn[i++];
\r
246 BinaryNode mappednode = findNodeSpec(node.getNodespec(), leaves);
\r
247 if (mappednode != null && mappednode instanceof SequenceNode)
\r
249 SequenceNode leaf = (SequenceNode) leaves.elementAt(i++);
\r
250 // check if we can make the specified association
\r
251 Object jvseq = null;
\r
252 int vrf = 0, refv = 0;
\r
253 while (jvseq == null && vrf < node.getVrefCount())
\r
255 if (refv < node.getVref(vrf).getRefsCount())
\r
257 Object noderef = node.getVref(vrf).getRefs(refv++);
\r
258 if (noderef instanceof AlignmentSequence)
\r
260 // we only make these kind of associations
\r
261 jvseq = getvObj2jv((Vobject) noderef);
\r
270 if (jvseq instanceof SequenceI)
\r
272 leaf.setElement(jvseq);
\r
273 leaf.setPlaceholder(false);
\r
277 leaf.setPlaceholder(true);
\r
279 .setElement(new Sequence(leaf.getName(),
\r
280 "THISISAPLACEHLDER"));
\r
286 // / TODO: refactor to vamsas :start
\r
288 * construct treenode mappings for mapped sequences
\r
294 public Treenode[] makeTreeNodes(NJTree ntree, Newick newick)
\r
296 Vector leaves = new Vector();
\r
297 ntree.findLeaves(ntree.getTopNode(), leaves);
\r
298 Vector tnv = new Vector();
\r
299 Enumeration l = leaves.elements();
\r
300 Hashtable nodespecs = new Hashtable();
\r
301 while (l.hasMoreElements())
\r
303 jalview.datamodel.BinaryNode tnode = (jalview.datamodel.BinaryNode) l
\r
305 if (tnode instanceof jalview.datamodel.SequenceNode)
\r
307 if (!((jalview.datamodel.SequenceNode) tnode).isPlaceholder())
\r
309 Object assocseq = ((jalview.datamodel.SequenceNode) tnode)
\r
311 if (assocseq instanceof SequenceI)
\r
313 Vobject vobj = this.getjv2vObj(assocseq);
\r
316 Treenode node = new Treenode();
\r
317 if (newick.isRegisterable())
\r
319 this.cdoc.registerObject(newick);
\r
320 node.addTreeId(newick);
\r
322 node.setNodespec(makeNodeSpec(nodespecs, tnode));
\r
323 node.setName(tnode.getName());
\r
324 Vref vr = new Vref();
\r
327 tnv.addElement(node);
\r
331 System.err.println("WARNING: Unassociated treeNode "
\r
332 + tnode.element().toString()
\r
334 + ((tnode.getName() != null) ? " label "
\r
335 + tnode.getName() : ""));
\r
341 if (tnv.size() > 0)
\r
343 Treenode[] tn = new Treenode[tnv.size()];
\r
347 return new Treenode[]
\r
351 private String makeNodeSpec(Hashtable nodespecs,
\r
352 jalview.datamodel.BinaryNode tnode)
\r
354 String nname = new String(tnode.getName());
\r
355 Integer nindx = (Integer) nodespecs.get(nname);
\r
358 nindx = new Integer(1);
\r
360 nname = nindx.toString() + " " + nname;
\r
365 * call to match up Treenode specs to NJTree parsed from document object.
\r
369 * as returned from NJTree.findLeaves( .., ..) ..
\r
372 private jalview.datamodel.BinaryNode findNodeSpec(String nodespec,
\r
375 int occurence = -1;
\r
376 String nspec = nodespec.substring(nodespec.indexOf(' ') + 1);
\r
377 String oval = nodespec.substring(0, nodespec.indexOf(' '));
\r
380 occurence = new Integer(oval).intValue();
\r
381 } catch (Exception e)
\r
383 System.err.println("Invalid nodespec '" + nodespec + "'");
\r
386 jalview.datamodel.BinaryNode bn = null;
\r
389 Enumeration en = leaves.elements();
\r
390 while (en.hasMoreElements() && nocc < occurence)
\r
392 bn = (jalview.datamodel.BinaryNode) en.nextElement();
\r
393 if (bn instanceof jalview.datamodel.SequenceNode
\r
394 && bn.getName().equals(nspec))
\r
404 // todo: end refactor to vamsas library
\r
406 * add jalview object to vamsas document
\r
411 tree = new uk.ac.vamsas.objects.core.Tree();
\r
412 bindjvvobj(tp, tree);
\r
413 tree.setTitle(tp.getTitle());
\r
414 Newick newick = new Newick();
\r
415 newick.setContent(tp.getTree().toString());
\r
416 newick.setTitle(tp.getTitle());
\r
417 tree.addNewick(newick);
\r
418 tree.setProvenance(makeTreeProvenance(jal, tp));
\r
419 tree.setTreenode(makeTreeNodes(tp.getTree(), newick));
\r
421 alignment.addTree(tree);
\r
425 * note: this function assumes that all sequence and alignment objects
\r
426 * referenced in input data has already been associated with jalview objects.
\r
429 * @param alignFrame
\r
430 * @return Object[] { AlignmentView, AlignmentI - reference alignment for
\r
433 public Object[] recoverInputData(Provenance tp)
\r
435 AlignViewport javport = null;
\r
436 jalview.datamodel.AlignmentI jal = null;
\r
437 jalview.datamodel.CigarArray view = null;
\r
438 for (int pe = 0; pe < tp.getEntryCount(); pe++)
\r
440 if (tp.getEntry(pe).getInputCount() > 0)
\r
442 if (tp.getEntry(pe).getInputCount() > 1)
\r
445 .warn("Ignoring additional input spec in provenance entry "
\r
446 + tp.getEntry(pe).toString());
\r
448 // LATER: deal sensibly with multiple inputs
\r
449 Input vInput = tp.getEntry(pe).getInput(0);
\r
450 // is this the whole alignment or a specific set of sequences ?
\r
451 if (vInput.getObjRefCount() == 0)
\r
453 if (tree.getV_parent()!=null && tree.getV_parent() instanceof uk.ac.vamsas.objects.core.Alignment)
\r
455 javport = getViewport(tree.getV_parent());
\r
456 jal = javport.getAlignment();
\r
457 view = javport.getAlignment().getCompactAlignment();
\r
462 // Explicit reference - to alignment, sequences or what.
\r
463 if (vInput.getObjRefCount() == 1
\r
464 && vInput.getObjRef(0) instanceof uk.ac.vamsas.objects.core.Alignment)
\r
466 // recover an AlignmentView for the input data
\r
467 javport = getViewport((Vobject) vInput.getObjRef(0));
\r
468 jal = javport.getAlignment();
\r
469 view = javport.getAlignment().getCompactAlignment();
\r
471 else if (vInput.getObjRef(0) instanceof uk.ac.vamsas.objects.core.AlignmentSequence)
\r
473 // recover an AlignmentView for the input data
\r
474 javport = getViewport(((Vobject) vInput.getObjRef(0)).getV_parent());
\r
475 jal = javport.getAlignment();
\r
476 jalview.datamodel.SequenceI[] seqs = new jalview.datamodel.SequenceI[vInput
\r
477 .getObjRefCount()];
\r
478 for (int i = 0, iSize = vInput.getObjRefCount(); i < iSize; i++)
\r
480 SequenceI seq = (SequenceI) getvObj2jv((Vobject) vInput
\r
484 view = new jalview.datamodel.Alignment(seqs)
\r
485 .getCompactAlignment();
\r
489 int from = 1, to = jal.getWidth();
\r
490 int offset = 0; // deleteRange modifies its frame of reference
\r
491 for (int r = 0, s = vInput.getSegCount(); r < s; r++)
\r
493 Seg visSeg = vInput.getSeg(r);
\r
494 int se[] = getSegRange(visSeg, true); // jalview doesn't do
\r
495 // bidirection alignments yet.
\r
498 Cache.log.warn("Ignoring invalid segment in InputData spec.");
\r
504 view.deleteRange(offset + from - 1, offset + se[0] - 2);
\r
505 offset -= se[0] - from;
\r
512 view.deleteRange(offset + from - 1, offset + to - 1); // final
\r
518 return new Object[]
\r
519 { new AlignmentView(view), jal };
\r
523 .debug("Returning null for input data recovery from provenance.");
\r
527 private AlignViewport getViewport(Vobject v_parent)
\r
529 if (v_parent instanceof uk.ac.vamsas.objects.core.Alignment)
\r
532 .findViewport((uk.ac.vamsas.objects.core.Alignment) v_parent);
\r
537 public NewickFile getNewickTree()
\r
542 public String getTitle()
\r
547 public AlignmentView getInputData()
\r
552 public boolean isValidTree()
\r
557 if (ntree.getTree() != null)
\r
559 ntree = getNtree();
\r
562 } catch (Exception e)
\r
564 Cache.log.debug("Failed to parse newick tree string", e);
\r