2 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
3 * Copyright (C) $$Year-Rel$$ The Jalview Authors
5 * This file is part of Jalview.
7 * Jalview is free software: you can redistribute it and/or
8 * modify it under the terms of the GNU General Public License
9 * as published by the Free Software Foundation, either version 3
10 * of the License, or (at your option) any later version.
12 * Jalview is distributed in the hope that it will be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty
14 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
15 * PURPOSE. See the GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
19 * The Jalview Authors are detailed in the 'AUTHORS' file.
21 package jalview.ws.seqfetcher;
23 import jalview.bin.Cache;
24 import jalview.datamodel.AlignmentI;
25 import jalview.datamodel.DBRefEntry;
26 import jalview.datamodel.SequenceI;
27 import jalview.util.DBRefUtils;
28 import jalview.util.MessageManager;
30 import java.util.ArrayList;
31 import java.util.Collections;
32 import java.util.Comparator;
33 import java.util.Enumeration;
34 import java.util.HashSet;
35 import java.util.Hashtable;
36 import java.util.List;
38 import java.util.Stack;
39 import java.util.Vector;
41 public class ASequenceFetcher
/*
 * Set of databases we can retrieve entries from. The outer key is the value
 * of DbSourceProxy.getDbSource(); the inner map holds the proxies registered
 * for that source, keyed by DbSourceProxy.getDbName(). The table is created
 * lazily by addDbRefSourceImpl, so it is null until the first proxy has been
 * registered.
 */
protected Hashtable<String, Map<String, DbSourceProxy>> fetchableDbs;

/*
 * Comparator to sort by tier (0/1/2) and name; assigned in the constructor
 * and used by getSourceProxy to order the proxies of a source.
 */
private Comparator<DbSourceProxy> proxyComparator;
/**
 * Constructor. Does not register any sources itself; it only sets up the
 * comparator used to order the proxies of a source.
 */
public ASequenceFetcher()
{
  proxyComparator = new Comparator<DbSourceProxy>()
  {
    /**
     * Orders proxies by ascending tier, then case-insensitively by database
     * name. Proxies in the same tier compare as equal if either name is
     * missing.
     */
    @Override
    public int compare(DbSourceProxy first, DbSourceProxy second)
    {
      // Tier 0 precedes 1 precedes 2
      int byTier = Integer.compare(first.getTier(), second.getTier());
      if (byTier != 0)
      {
        return byTier;
      }

      // same tier: fall back to the name (null names should never happen)
      String firstName = first.getDbName();
      String secondName = second.getDbName();
      if (firstName == null || secondName == null)
      {
        return 0;
      }
      return firstName.compareToIgnoreCase(secondName);
    }
  };
}
89 * get array of supported Databases
91 * @return database source string for each database - only the latest version
92 * of a source db is bound to each source.
94 public String[] getSupportedDb()
96 if (fetchableDbs == null)
100 String[] sf = fetchableDbs.keySet().toArray(
101 new String[fetchableDbs.size()]);
105 public boolean isFetchable(String source)
107 for (String db : fetchableDbs.keySet())
109 if (source.equalsIgnoreCase(db))
114 Cache.log.warn("isFetchable doesn't know about '" + source
120 * Fetch sequences for the given cross-references
124 * if true, only fetch from nucleotide data sources, else peptide
127 public SequenceI[] getSequences(DBRefEntry[] refs, boolean dna)
129 Vector<SequenceI> rseqs = new Vector<SequenceI>();
130 Hashtable<String, List<String>> queries = new Hashtable<String, List<String>>();
131 for (int r = 0; r < refs.length; r++)
133 if (!queries.containsKey(refs[r].getSource()))
135 queries.put(refs[r].getSource(), new ArrayList<String>());
137 List<String> qset = queries.get(refs[r].getSource());
138 if (!qset.contains(refs[r].getAccessionId()))
140 qset.add(refs[r].getAccessionId());
143 Enumeration<String> e = queries.keys();
144 while (e.hasMoreElements())
146 List<String> query = null;
148 db = e.nextElement();
149 query = queries.get(db);
150 if (!isFetchable(db))
152 reportStdError(db, query, new Exception(
153 "Don't know how to fetch from this database :" + db));
157 Stack<String> queriesLeft = new Stack<String>();
158 queriesLeft.addAll(query);
160 List<DbSourceProxy> proxies = getSourceProxy(db);
161 for (DbSourceProxy fetcher : proxies)
163 List<String> queriesMade = new ArrayList<String>();
164 HashSet<String> queriesFound = new HashSet<String>();
167 if (fetcher.isDnaCoding() != dna)
169 continue; // wrong sort of data
171 boolean doMultiple = fetcher.getMaximumQueryCount() > 1;
172 while (!queriesLeft.isEmpty())
174 StringBuffer qsb = new StringBuffer();
177 if (qsb.length() > 0)
179 qsb.append(fetcher.getAccessionSeparator());
181 String q = queriesLeft.pop();
184 } while (doMultiple && !queriesLeft.isEmpty());
186 AlignmentI seqset = null;
189 // create a fetcher and go to it
190 seqset = fetcher.getSequenceRecords(qsb.toString());
191 } catch (Exception ex)
193 System.err.println("Failed to retrieve the following from "
195 System.err.println(qsb);
196 ex.printStackTrace(System.err);
198 // TODO: Merge alignment together - perhaps
201 SequenceI seqs[] = seqset.getSequencesArray();
204 for (int is = 0; is < seqs.length; is++)
206 rseqs.addElement(seqs[is]);
207 DBRefEntry[] frefs = DBRefUtils.searchRefs(seqs[is]
208 .getDBRefs(), new DBRefEntry(db, null, null));
211 for (DBRefEntry dbr : frefs)
213 queriesFound.add(dbr.getAccessionId());
214 queriesMade.remove(dbr.getAccessionId());
222 if (fetcher.getRawRecords() != null)
224 System.out.println("# Retrieved from " + db + ":"
226 StringBuffer rrb = fetcher.getRawRecords();
228 * for (int rr = 0; rr<rrb.length; rr++) {
233 hdr = "# " + db + ":" + qsb.toString();
235 * } else { hdr = "# part "+rr; }
237 System.out.println(hdr);
240 System.out.println(rrb);
242 System.out.println("# end of " + hdr);
249 } catch (Exception ex)
251 reportStdError(db, queriesMade, ex);
253 if (queriesMade.size() > 0)
255 System.out.println("# Adding " + queriesMade.size()
256 + " ids back to queries list for searching again (" + db
258 queriesLeft.addAll(queriesMade);
263 SequenceI[] result = null;
264 if (rseqs.size() > 0)
266 result = new SequenceI[rseqs.size()];
268 for (SequenceI s : rseqs)
277 public void reportStdError(String db, List<String> queriesMade,
281 System.err.println("Failed to retrieve the following references from "
284 for (String qv : queriesMade)
286 System.err.print(" " + qv + ";");
289 System.err.println();
293 System.err.println();
294 ex.printStackTrace();
298 * Returns a list of proxies for the given source
301 * database source string TODO: add version string/wildcard for
302 * retrieval of specific DB source/version combinations.
303 * @return a list of DbSourceProxy for the db
305 public List<DbSourceProxy> getSourceProxy(String db)
307 db = DBRefUtils.getCanonicalName(db);
308 Map<String, DbSourceProxy> dblist = fetchableDbs.get(db);
311 return new ArrayList<DbSourceProxy>();
315 * sort so that primary sources precede secondary
317 List<DbSourceProxy> dbs = new ArrayList<DbSourceProxy>(dblist.values());
318 Collections.sort(dbs, proxyComparator);
323 * constructs an instance of the proxy and registers it as a valid dbrefsource
325 * @param dbSourceProxy
326 * reference for class implementing
327 * jalview.ws.seqfetcher.DbSourceProxy
329 protected void addDBRefSourceImpl(
330 Class<? extends DbSourceProxy> dbSourceProxy)
331 throws IllegalArgumentException
333 DbSourceProxy proxy = null;
336 DbSourceProxy proxyObj = dbSourceProxy.getConstructor().newInstance();
338 } catch (IllegalArgumentException e)
341 } catch (Exception e)
343 // Serious problems if this happens.
346 .getString("error.dbrefsource_implementation_exception"),
349 addDbRefSourceImpl(proxy);
353 * add the properly initialised DbSourceProxy object 'proxy' to the list of
358 protected void addDbRefSourceImpl(DbSourceProxy proxy)
362 if (fetchableDbs == null)
364 fetchableDbs = new Hashtable<String, Map<String, DbSourceProxy>>();
366 Map<String, DbSourceProxy> slist = fetchableDbs.get(proxy
370 fetchableDbs.put(proxy.getDbSource(),
371 slist = new Hashtable<String, DbSourceProxy>());
373 slist.put(proxy.getDbName(), proxy);
378 * select sources which are implemented by instances of the given class
380 * @param class that implements DbSourceProxy
381 * @return null or vector of source names for fetchers
383 public String[] getDbInstances(Class class1)
385 if (!DbSourceProxy.class.isAssignableFrom(class1))
390 "error.implementation_error_dbinstance_must_implement_interface",
391 new String[] { class1.toString() }));
393 if (fetchableDbs == null)
397 String[] sources = null;
398 Vector<String> src = new Vector<String>();
399 Enumeration<String> dbs = fetchableDbs.keys();
400 while (dbs.hasMoreElements())
402 String dbn = dbs.nextElement();
403 for (DbSourceProxy dbp : fetchableDbs.get(dbn).values())
405 if (class1.isAssignableFrom(dbp.getClass()))
413 src.copyInto(sources = new String[src.size()]);
418 public DbSourceProxy[] getDbSourceProxyInstances(Class class1)
420 List<DbSourceProxy> prlist = new ArrayList<DbSourceProxy>();
421 for (String fetchable : getSupportedDb())
423 for (DbSourceProxy pr : getSourceProxy(fetchable))
425 if (class1.isInstance(pr))
431 if (prlist.size() == 0)
435 return prlist.toArray(new DbSourceProxy[0]);