2 * Jalview - A Sequence Alignment Editor and Viewer
\r
3 * Copyright (C) 2007 AM Waterhouse, J Procter, G Barton, M Clamp, S Searle
\r
5 * This program is free software; you can redistribute it and/or
\r
6 * modify it under the terms of the GNU General Public License
\r
7 * as published by the Free Software Foundation; either version 2
\r
8 * of the License, or (at your option) any later version.
\r
10 * This program is distributed in the hope that it will be useful,
\r
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
\r
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
\r
13 * GNU General Public License for more details.
\r
15 * You should have received a copy of the GNU General Public License
\r
16 * along with this program; if not, write to the Free Software
\r
17 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
\r
24 import javax.swing.*;
\r
26 import org.biojava.dasobert.das.*;
\r
27 import org.biojava.dasobert.das2.*;
\r
28 import org.biojava.dasobert.das2.io.*;
\r
29 import org.biojava.dasobert.dasregistry.*;
\r
30 import org.biojava.dasobert.eventmodel.*;
\r
31 import jalview.bin.Cache;
\r
32 import jalview.datamodel.*;
\r
33 import jalview.gui.*;
\r
39 * @version $Revision$
\r
41 public class DasSequenceFeatureFetcher
\r
43 SequenceI[] sequences;
\r
47 FeatureSettings fsettings;
\r
49 StringBuffer sbuffer = new StringBuffer();
\r
51 Vector selectedSources;
\r
53 boolean cancelled = false;
\r
54 private void debug(String mesg)
\r
58 private void debug(String mesg, Exception e)
\r
60 if (Cache.log!=null)
\r
62 Cache.log.debug(mesg, e);
\r
64 System.err.println(mesg);
\r
67 e.printStackTrace();
\r
74 * Creates a new SequenceFeatureFetcher object.
\r
77 * @param align DOCUMENT ME!
\r
78 * @param ap DOCUMENT ME!
\r
80 public DasSequenceFeatureFetcher(SequenceI[] sequences,
\r
81 FeatureSettings fsettings, Vector selectedSources)
\r
83 this(sequences, fsettings, selectedSources, true, true);
\r
85 public DasSequenceFeatureFetcher(SequenceI[] sequences,
\r
86 FeatureSettings fsettings, Vector selectedSources, boolean checkDbrefs, boolean promptFetchDbrefs)
\r
88 this.selectedSources = selectedSources;
\r
89 this.sequences = sequences;
\r
90 if (fsettings!=null)
\r
92 this.fsettings = fsettings;
\r
93 this.af = fsettings.af;
\r
94 af.getViewport().setShowSequenceFeatures(true);
\r
96 int uniprotCount = 0;
\r
97 for (int i = 0; i < selectedSources.size(); i++)
\r
99 DasSource source = (DasSource) selectedSources.elementAt(i);
\r
100 DasCoordinateSystem[] coords = source.getCoordinateSystem();
\r
101 for (int c = 0; c < coords.length; c++)
\r
103 if (coords[c].getName().indexOf("UniProt") > -1)
\r
112 for (int i = 0; i < sequences.length; i++)
\r
114 DBRefEntry[] dbref = sequences[i].getDBRef();
\r
117 for (int j = 0; j < dbref.length; j++)
\r
119 if (dbref[j].getSource().equals(
\r
120 jalview.datamodel.DBRefSource.UNIPROT))
\r
129 if (checkDbrefs && refCount < sequences.length && uniprotCount > 0)
\r
132 int reply = JOptionPane.YES_OPTION;
\r
133 if (promptFetchDbrefs)
\r
135 reply = JOptionPane.showInternalConfirmDialog(Desktop.desktop,
\r
136 "Do you want Jalview to find\n"
\r
137 + "Uniprot Accession ids for given sequence names?",
\r
138 "Find Uniprot Accession Ids", JOptionPane.YES_NO_OPTION,
\r
139 JOptionPane.QUESTION_MESSAGE);
\r
143 if (reply == JOptionPane.YES_OPTION)
\r
145 Thread thread = new Thread(new FetchDBRefs());
\r
160 class FetchDBRefs implements Runnable
\r
164 new DBRefFetcher(sequences, af).fetchDBRefs(true);
\r
170 * Spawns a number of dasobert Fetcher threads to add features to sequences in the dataset
\r
172 void startFetching()
\r
175 startTime = System.currentTimeMillis();
\r
178 af.setProgressBar("Fetching DAS Sequence Features", startTime);
\r
181 DasSource[] sources = new jalview.gui.DasSourceBrowser().getDASSource();
\r
183 if (selectedSources == null || selectedSources.size() == 0)
\r
185 String active = jalview.bin.Cache.getDefault("DAS_ACTIVE_SOURCE",
\r
187 StringTokenizer st = new StringTokenizer(active, "\t");
\r
188 Vector selectedSources = new Vector();
\r
190 while (st.hasMoreTokens())
\r
192 token = st.nextToken();
\r
193 for (int i = 0; i < sources.length; i++)
\r
195 if (sources[i].getNickname().equals(token))
\r
197 selectedSources.addElement(sources[i]);
\r
204 if (selectedSources == null || selectedSources.size() == 0)
\r
206 System.out.println("No DAS Sources active");
\r
208 setGuiNoDassourceActive();
\r
212 sourcesRemaining = selectedSources.size();
\r
213 //Now sending requests one at a time to each server
\r
214 for (int sourceIndex = 0; sourceIndex < selectedSources.size()
\r
215 && !cancelled; sourceIndex++)
\r
217 DasSource dasSource = (DasSource) selectedSources
\r
218 .elementAt(sourceIndex);
\r
220 nextSequence(dasSource, sequences[0]);
\r
224 private void setGuiNoDassourceActive()
\r
229 af.setProgressBar("No DAS Sources Active", startTime);
\r
231 if (getFeatSettings()!=null)
\r
233 fsettings.noDasSourceActive();
\r
238 * Update our fsettings dialog reference if we didn't have one when we were first initialised.
\r
239 * @return fsettings
\r
241 private FeatureSettings getFeatSettings()
\r
243 if (fsettings == null)
\r
247 fsettings = af.featureSettings;
\r
253 public void cancel()
\r
257 af.setProgressBar("DAS Feature Fetching Cancelled", startTime);
\r
262 int sourcesRemaining = 0;
\r
264 void responseComplete(DasSource dasSource, SequenceI seq)
\r
268 for (int seqIndex = 0; seqIndex < sequences.length - 1 && !cancelled; seqIndex++)
\r
270 if (sequences[seqIndex] == seq)
\r
272 nextSequence(dasSource, sequences[++seqIndex]);
\r
278 sourcesRemaining--;
\r
280 if (sourcesRemaining == 0)
\r
282 System.err.println("Fetching Complete.");
\r
283 setGuiFetchComplete();
\r
288 private void setGuiFetchComplete()
\r
293 af.setProgressBar("DAS Feature Fetching Complete", startTime);
\r
296 if (af != null && af.featureSettings != null)
\r
298 af.featureSettings.setTableData();
\r
301 if (getFeatSettings() != null)
\r
303 fsettings.complete();
\r
307 void featuresAdded(SequenceI seq)
\r
311 // no gui to update with features.
\r
314 af.getFeatureRenderer().featuresAdded();
\r
316 int start = af.getViewport().getStartSeq();
\r
317 int end = af.getViewport().getEndSeq();
\r
319 for (index = start; index < end; index++)
\r
321 if (seq == af.getViewport().getAlignment().getSequenceAt(index)
\r
322 .getDatasetSequence())
\r
324 af.alignPanel.paintAlignment(true);
\r
330 void nextSequence(DasSource dasSource, SequenceI seq)
\r
334 DBRefEntry[] uprefs = jalview.util.DBRefUtils.selectRefs(
\r
335 seq.getDBRef(), new String[]
\r
337 // jalview.datamodel.DBRefSource.PDB,
\r
338 jalview.datamodel.DBRefSource.UNIPROT,
\r
339 // jalview.datamodel.DBRefSource.EMBL - not tested on any EMBL coord sys sources
\r
341 // TODO: minimal list of DAS queries to make by querying with untyped ID if distinct from any typed IDs
\r
343 boolean dasCoordSysFound = false;
\r
345 if (uprefs != null)
\r
347 // do any of these ids match the source's coordinate system ?
\r
348 for (int j = 0; !dasCoordSysFound && j < uprefs.length; j++)
\r
350 DasCoordinateSystem cs[] = dasSource.getCoordinateSystem();
\r
352 for (int csIndex = 0; csIndex < cs.length && !dasCoordSysFound; csIndex++)
\r
355 && jalview.util.DBRefUtils.isDasCoordinateSystem(
\r
356 cs[csIndex].getName(), uprefs[j]))
\r
358 debug("Launched fetcher for coordinate system "
\r
359 + cs[0].getName());
\r
360 // Will have to pass any mapping information to the fetcher
\r
361 //- the start/end for the DBRefEntry may not be the same as the sequence's start/end
\r
363 System.out.println(seq.getName() + " "
\r
364 + (seq.getDatasetSequence() == null) + " "
\r
365 + dasSource.getUrl());
\r
367 dasCoordSysFound = true; // break's out of the loop
\r
368 createFeatureFetcher(seq, dasSource, uprefs[j]);
\r
371 System.out.println("IGNORE " + cs[csIndex].getName());
\r
376 if (!dasCoordSysFound)
\r
379 // try and use the name as the sequence id
\r
380 if (seq.getName().indexOf("|") > -1)
\r
382 id = seq.getName().substring(seq.getName().lastIndexOf("|") + 1);
\r
383 if (id.trim().length()<4)
\r
385 // hack - we regard a significant ID as being at least 4 non-whitespace characters
\r
386 id = seq.getName().substring(0, seq.getName().lastIndexOf("|"));
\r
387 if (id.indexOf("|")>-1)
\r
389 id = id.substring(id.lastIndexOf("|")+1);
\r
395 id = seq.getName();
\r
399 // Should try to call a general feature fetcher that
\r
400 // queries many sources with name to discover applicable ID references
\r
401 createFeatureFetcher(seq, dasSource, id);
\r
408 * fetch and add das features to a sequence using the given source URL and compatible DbRef id.
\r
409 * new features are mapped using the DbRef mapping to the local coordinate system.
\r
414 protected void createFeatureFetcher(final SequenceI seq,
\r
415 final DasSource dasSource, final DBRefEntry dbref)
\r
419 /// fetch DAS features
\r
420 final Das1Source source = new Das1Source();
\r
421 source.setUrl(dasSource.getUrl());
\r
422 source.setNickname(dasSource.getNickname());
\r
423 if (dbref == null || dbref.getAccessionId() == null
\r
424 || dbref.getAccessionId().length() < 1)
\r
426 responseComplete(dasSource, seq); // reduce thread count anyhow
\r
429 debug("new Das Feature Fetcher for " + dbref.getSource()
\r
430 + ":" + dbref.getAccessionId() + " querying "
\r
431 + dasSource.getUrl());
\r
432 FeatureThread fetcher = new FeatureThread(dbref.getAccessionId()
\r
433 // + ":" + start + "," + end,
\r
436 fetcher.addFeatureListener(new FeatureListener()
\r
438 public void comeBackLater(FeatureEvent e)
\r
440 responseComplete(dasSource, seq);
\r
441 debug("das source " + e.getSource().getNickname()
\r
442 + " asked us to come back in " + e.getComeBackLater()
\r
446 public void newFeatures(FeatureEvent e)
\r
449 Das1Source ds = e.getSource();
\r
451 Map[] features = e.getFeatures();
\r
452 // add features to sequence
\r
453 debug("das source " + ds.getUrl() + " returned "
\r
454 + features.length + " features");
\r
456 if (features.length > 0)
\r
458 for (int i = 0; i < features.length; i++)
\r
460 SequenceFeature f = newSequenceFeature(features[i], source
\r
462 if (dbref.getMap() != null && f.getBegin() > 0
\r
465 debug("mapping from " + f.getBegin() + " - "
\r
467 SequenceFeature vf[] = null;
\r
471 vf = dbref.getMap().locateFeature(f);
\r
472 } catch (Exception ex)
\r
475 .info("Error in 'experimental' mapping of features. Please try to reproduce and then report info to help@jalview.org.");
\r
476 Cache.log.info("Mapping feature from " + f.getBegin()
\r
477 + " to " + f.getEnd() + " in dbref "
\r
478 + dbref.getAccessionId() + " in "
\r
479 + dbref.getSource());
\r
480 Cache.log.info("using das Source " + ds.getUrl());
\r
481 Cache.log.info("Exception", ex);
\r
486 for (int v = 0; v < vf.length; v++)
\r
488 debug("mapping to " + v + ": "
\r
489 + vf[v].getBegin() + " - " + vf[v].getEnd());
\r
490 seq.addSequenceFeature(vf[v]);
\r
496 seq.addSequenceFeature(f);
\r
500 featuresAdded(seq);
\r
504 // System.out.println("No features found for " + seq.getName()
\r
505 // + " from: " + e.getDasSource().getNickname());
\r
507 responseComplete(dasSource, seq);
\r
517 protected void createFeatureFetcher(final SequenceI seq,
\r
518 final DasSource dasSource, String id)
\r
521 /// fetch DAS features
\r
522 final Das1Source source = new Das1Source();
\r
523 source.setUrl(dasSource.getUrl());
\r
524 source.setNickname(dasSource.getNickname());
\r
530 if (id != null && id.length() > 0)
\r
532 debug("new Das Feature Fetcher for " + id + " querying "
\r
533 + dasSource.getUrl());
\r
534 FeatureThread fetcher = new FeatureThread(id
\r
535 // + ":" + start + "," + end,
\r
538 fetcher.addFeatureListener(new FeatureListener()
\r
540 public void comeBackLater(FeatureEvent e)
\r
542 responseComplete(dasSource, seq);
\r
543 debug("das source " + e.getSource().getNickname()
\r
544 + " asked us to come back in " + e.getComeBackLater()
\r
548 public void newFeatures(FeatureEvent e)
\r
551 Das1Source ds = e.getSource();
\r
553 Map[] features = e.getFeatures();
\r
554 // add features to sequence
\r
555 debug("das source " + ds.getUrl() + " returned "
\r
556 + features.length + " features");
\r
558 if (features.length > 0)
\r
560 for (int i = 0; i < features.length; i++)
\r
562 SequenceFeature f = newSequenceFeature(features[i], source
\r
565 seq.addSequenceFeature(f);
\r
568 featuresAdded(seq);
\r
572 // System.out.println("No features found for " + seq.getName()
\r
573 // + " from: " + e.getDasSource().getNickname());
\r
575 responseComplete(dasSource, seq);
\r
584 // invalid fetch - indicate it is finished.
\r
585 debug("Skipping empty ID for querying "
\r
586 + dasSource.getUrl());
\r
587 responseComplete(dasSource, seq);
\r
592 * creates a jalview sequence feature from a das feature document
\r
593 * @param dasfeature
\r
594 * @return sequence feature object created using dasfeature information
\r
596 SequenceFeature newSequenceFeature(Map dasfeature, String nickname)
\r
598 if (dasfeature == null)
\r
605 * Different qNames for a DAS Feature - are string keys to the HashMaps in features
\r
607 qName.equals("TYPE") ||
\r
608 qName.equals("START") ||
\r
609 qName.equals("END") ||
\r
610 qName.equals("NOTE") ||
\r
611 qName.equals("LINK") ||
\r
612 qName.equals("SCORE")
\r
614 String desc = new String();
\r
615 if (dasfeature.containsKey("NOTE"))
\r
617 desc += (String) dasfeature.get("NOTE");
\r
620 int start = 0, end = 0;
\r
625 start = Integer.parseInt(dasfeature.get("START").toString());
\r
626 } catch (Exception ex)
\r
631 end = Integer.parseInt(dasfeature.get("END").toString());
\r
632 } catch (Exception ex)
\r
637 score = Integer.parseInt(dasfeature.get("SCORE").toString());
\r
638 } catch (Exception ex)
\r
642 SequenceFeature f = new SequenceFeature((String) dasfeature
\r
643 .get("TYPE"), desc, start, end, score, nickname);
\r
645 if (dasfeature.containsKey("LINK"))
\r
647 f.addLink(f.getType() + " " + f.begin + "_" + f.end + "|"
\r
648 + dasfeature.get("LINK"));
\r
652 } catch (Exception e)
\r
654 System.out.println("ERRR " + e);
\r
655 e.printStackTrace();
\r
656 System.out.println("############");
\r
657 debug("Failed to parse " + dasfeature.toString(), e);
\r
662 * query the default DAS Source Registry for sources.
\r
663 * Uses value of jalview property DAS_REGISTRY_URL and the DasSourceBrowser.DEFAULT_REGISTRY if that doesn't exist.
\r
664 * @return list of sources
\r
666 public static DasSource[] getDASSources()
\r
669 String registryURL = jalview.bin.Cache.getDefault("DAS_REGISTRY_URL",
\r
670 DasSourceBrowser.DEFAULT_REGISTRY);
\r
671 return getDASSources(registryURL);
\r
674 * query the given URL for DasSources.
\r
675 * @param registryURL
\r
676 * return sources from registryURL
\r
678 public static DasSource[] getDASSources(String registryURL)
\r
680 DasSourceReaderImpl reader = new DasSourceReaderImpl();
\r
684 URL url = new URL(registryURL);
\r
686 DasSource[] sources = reader.readDasSource(url);
\r
688 List das1sources = new ArrayList();
\r
689 for (int i = 0; i < sources.length; i++)
\r
691 DasSource ds = sources[i];
\r
692 if (ds instanceof Das2Source)
\r
694 Das2Source d2s = (Das2Source) ds;
\r
695 if (d2s.hasDas1Capabilities())
\r
697 Das1Source d1s = DasSourceConverter.toDas1Source(d2s);
\r
698 das1sources.add(d1s);
\r
702 else if (ds instanceof Das1Source)
\r
704 das1sources.add((Das1Source) ds);
\r
708 return (Das1Source[]) das1sources.toArray(new Das1Source[das1sources
\r
710 } catch (Exception ex)
\r
712 ex.printStackTrace();
\r