2 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
3 * Copyright (C) $$Year-Rel$$ The Jalview Authors
5 * This file is part of Jalview.
7 * Jalview is free software: you can redistribute it and/or
8 * modify it under the terms of the GNU General Public License
9 * as published by the Free Software Foundation, either version 3
10 * of the License, or (at your option) any later version.
12 * Jalview is distributed in the hope that it will be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty
14 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
15 * PURPOSE. See the GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
19 * The Jalview Authors are detailed in the 'AUTHORS' file.
21 package jalview.ws.seqfetcher;
23 import jalview.api.FeatureSettingsModelI;
24 import jalview.bin.Cache;
25 import jalview.datamodel.AlignmentI;
26 import jalview.datamodel.DBRefEntry;
27 import jalview.datamodel.SequenceI;
28 import jalview.util.DBRefUtils;
29 import jalview.util.MessageManager;
31 import java.util.ArrayList;
32 import java.util.Collections;
33 import java.util.Comparator;
34 import java.util.Enumeration;
35 import java.util.HashSet;
36 import java.util.Hashtable;
37 import java.util.List;
39 import java.util.Stack;
40 import java.util.Vector;
42 public class ASequenceFetcher
46 * set of databases we can retrieve entries from
48 protected Hashtable<String, Map<String, DbSourceProxy>> fetchableDbs;
51 * comparator to sort by tier (0/1/2) and name
53 private Comparator<DbSourceProxy> proxyComparator;
/**
 * Constructor. Sets up the comparator used to order the proxies of a
 * database source: lower tiers sort first, and proxies in the same tier are
 * ordered by database name, ignoring case.
 */
protected ASequenceFetcher()
{
  proxyComparator = new Comparator<DbSourceProxy>()
  {
    @Override
    public int compare(DbSourceProxy first, DbSourceProxy second)
    {
      // Tier 0 precedes 1 precedes 2
      int byTier = Integer.compare(first.getTier(), second.getTier());
      if (byTier != 0)
      {
        return byTier;
      }

      // same tier: decide on the name, ignoring case. A missing name should
      // never happen; it is treated as a tie rather than risking a
      // NullPointerException.
      String firstName = first.getDbName();
      String secondName = second.getDbName();
      if (firstName == null || secondName == null)
      {
        return 0;
      }
      return firstName.compareToIgnoreCase(secondName);
    }
  };
}
90 * get array of supported Databases
92 * @return database source string for each database - only the latest version
93 * of a source db is bound to each source.
95 public String[] getSupportedDb()
97 if (fetchableDbs == null)
101 String[] sf = fetchableDbs.keySet()
102 .toArray(new String[fetchableDbs.size()]);
106 public boolean isFetchable(String source)
108 for (String db : fetchableDbs.keySet())
110 if (source.equalsIgnoreCase(db))
115 Cache.log.warn("isFetchable doesn't know about '" + source + "'");
120 * Fetch sequences for the given cross-references
124 * if true, only fetch from nucleotide data sources, else peptide
// Retrieves sequences for the supplied cross-references, collecting them in
// rseqs. Accession ids are first grouped per canonical source name; each
// source is then queried through the proxies returned by getSourceProxy.
// NOTE(review): several short lines (braces, try/do keywords and some
// statements) are not visible in this copy of the method - confirm any
// detail noted below against the complete file before relying on it.
127 public SequenceI[] getSequences(List<DBRefEntry> refs, boolean dna)
129 Vector<SequenceI> rseqs = new Vector<>();
// accession ids to fetch, keyed by canonical source name
130 Hashtable<String, List<String>> queries = new Hashtable<>();
131 for (DBRefEntry ref : refs)
// refs are grouped under the canonical form of their source name
133 String canonical = DBRefUtils.getCanonicalName(ref.getSource());
134 if (!queries.containsKey(canonical))
136 queries.put(canonical, new ArrayList<String>());
138 List<String> qset = queries.get(canonical);
// each accession id is queued at most once per source
139 if (!qset.contains(ref.getAccessionId()))
141 qset.add(ref.getAccessionId());
144 Enumeration<String> e = queries.keys();
145 while (e.hasMoreElements())
147 List<String> query = null;
149 db = e.nextElement();
150 query = queries.get(db);
// a source that isFetchable does not recognise is reported via reportStdError
151 if (!isFetchable(db))
153 reportStdError(db, query, new Exception(
154 "Don't know how to fetch from this database :" + db));
// work stack of the accession ids still to be requested for this source
158 Stack<String> queriesLeft = new Stack<>();
159 queriesLeft.addAll(query);
161 List<DbSourceProxy> proxies = getSourceProxy(db);
162 for (DbSourceProxy fetcher : proxies)
// ids handed to this proxy; ids matched in the results are removed again below
164 List<String> queriesMade = new ArrayList<>();
// accession ids seen in the dbrefs of retrieved sequences
165 HashSet<String> queriesFound = new HashSet<>();
// only proxies whose isDnaCoding() agrees with the dna flag are used
168 if (fetcher.isDnaCoding() != dna)
170 continue; // wrong sort of data
// true when the proxy reports a maximum query count above one
172 boolean doMultiple = fetcher.getMaximumQueryCount() > 1;
173 while (!queriesLeft.isEmpty())
// query string for a single request to the proxy
175 StringBuffer qsb = new StringBuffer();
// presumably the body of a do/while that joins several ids with the proxy
// accession separator when doMultiple is set - the loop head and the
// statements consuming q are not visible here; confirm
178 if (qsb.length() > 0)
180 qsb.append(fetcher.getAccessionSeparator());
182 String q = queriesLeft.pop();
185 } while (doMultiple && !queriesLeft.isEmpty());
187 AlignmentI seqset = null;
190 // create a fetcher and go to it
191 seqset = fetcher.getSequenceRecords(qsb.toString());
// a failed request is logged to stderr together with the query string; no
// rethrow is visible in this handler
192 } catch (Exception ex)
195 "Failed to retrieve the following from " + db);
196 System.err.println(qsb);
197 ex.printStackTrace(System.err);
199 // TODO: Merge alignment together - perhaps
202 SequenceI seqs[] = seqset.getSequencesArray();
205 for (int is = 0; is < seqs.length; is++)
207 rseqs.addElement(seqs[is]);
// search the dbrefs of the retrieved sequence using an entry built for this source
208 List<DBRefEntry> frefs = DBRefUtils.searchRefs(
209 seqs[is].getDBRefs(),
210 new DBRefEntry(db, null, null));
211 for (DBRefEntry dbr : frefs)
// an accession id found in the results no longer counts as outstanding
213 queriesFound.add(dbr.getAccessionId());
214 queriesMade.remove(dbr.getAccessionId());
// any raw records held by the proxy are echoed to stdout between header lines
221 if (fetcher.getRawRecords() != null)
224 "# Retrieved from " + db + ":" + qsb.toString());
225 StringBuffer rrb = fetcher.getRawRecords();
227 * for (int rr = 0; rr<rrb.length; rr++) {
232 hdr = "# " + db + ":" + qsb.toString();
234 * } else { hdr = "# part "+rr; }
236 System.out.println(hdr);
239 System.out.println(rrb);
241 System.out.println("# end of " + hdr);
// any other failure while using this proxy is reported along with the ids
// still held in queriesMade
248 } catch (Exception ex)
250 reportStdError(db, queriesMade, ex);
// ids still in queriesMade go back onto the work stack, presumably so the
// next proxy for this source can try them - confirm
252 if (queriesMade.size() > 0)
254 System.out.println("# Adding " + queriesMade.size()
255 + " ids back to queries list for searching again (" + db
257 queriesLeft.addAll(queriesMade);
// result stays null unless at least one sequence was retrieved
262 SequenceI[] result = null;
263 if (rseqs.size() > 0)
265 result = new SequenceI[rseqs.size()];
267 for (SequenceI s : rseqs)
// Writes a failure report to stderr: a heading naming the database, the
// query ids that were being retrieved, and the stack trace of the exception.
// NOTE(review): some short lines of this method (including the rest of its
// signature) are not visible in this copy - confirm against the full file.
276 public void reportStdError(String db, List<String> queriesMade,
281 "Failed to retrieve the following references from " + db);
// each id is printed with a leading space and a trailing semicolon
283 for (String qv : queriesMade)
285 System.err.print(" " + qv + ";");
// NOTE(review): this line break appears to sit inside the loop; the
// condition that triggers it is not visible here - confirm
288 System.err.println();
// end the id list before printing the stack trace
292 System.err.println();
293 ex.printStackTrace();
297 * Returns a list of proxies for the given source
300 * database source string TODO: add version string/wildcard for
301 * retrieval of specific DB source/version combinations.
302 * @return a list of DbSourceProxy for the db
304 public List<DbSourceProxy> getSourceProxy(String db)
306 db = DBRefUtils.getCanonicalName(db);
307 Map<String, DbSourceProxy> dblist = fetchableDbs.get(db);
310 return new ArrayList<>();
314 * sort so that primary sources precede secondary
316 List<DbSourceProxy> dbs = new ArrayList<>(dblist.values());
317 Collections.sort(dbs, proxyComparator);
322 * constructs an instance of the proxy and registers it as a valid dbrefsource
324 * @param dbSourceProxy
325 * reference for class implementing
326 * jalview.ws.seqfetcher.DbSourceProxy
328 protected void addDBRefSourceImpl(
329 Class<? extends DbSourceProxy> dbSourceProxy)
330 throws IllegalArgumentException
332 DbSourceProxy proxy = null;
335 DbSourceProxy proxyObj = dbSourceProxy.getConstructor().newInstance();
337 } catch (IllegalArgumentException e)
340 } catch (Exception e)
342 // Serious problems if this happens.
343 throw new Error(MessageManager
344 .getString("error.dbrefsource_implementation_exception"), e);
346 addDbRefSourceImpl(proxy);
350 * add the properly initialised DbSourceProxy object 'proxy' to the list of
355 protected void addDbRefSourceImpl(DbSourceProxy proxy)
359 if (fetchableDbs == null)
361 fetchableDbs = new Hashtable<>();
363 Map<String, DbSourceProxy> slist = fetchableDbs
364 .get(proxy.getDbSource());
367 fetchableDbs.put(proxy.getDbSource(),
368 slist = new Hashtable<>());
370 slist.put(proxy.getDbName(), proxy);
375 * select sources which are implemented by instances of the given class
378 * that implements DbSourceProxy
379 * @return null or vector of source names for fetchers
381 public String[] getDbInstances(Class class1)
383 if (!DbSourceProxy.class.isAssignableFrom(class1))
385 throw new Error(MessageManager.formatMessage(
386 "error.implementation_error_dbinstance_must_implement_interface",
388 { class1.toString() }));
390 if (fetchableDbs == null)
394 String[] sources = null;
395 Vector<String> src = new Vector<>();
396 Enumeration<String> dbs = fetchableDbs.keys();
397 while (dbs.hasMoreElements())
399 String dbn = dbs.nextElement();
400 for (DbSourceProxy dbp : fetchableDbs.get(dbn).values())
402 if (class1.isAssignableFrom(dbp.getClass()))
410 src.copyInto(sources = new String[src.size()]);
415 public DbSourceProxy[] getDbSourceProxyInstances(Class class1)
417 List<DbSourceProxy> prlist = new ArrayList<>();
418 for (String fetchable : getSupportedDb())
420 for (DbSourceProxy pr : getSourceProxy(fetchable))
422 if (class1.isInstance(pr))
428 if (prlist.size() == 0)
432 return prlist.toArray(new DbSourceProxy[0]);
436 * Returns a preferred feature colouring scheme for the given source, or null
437 * if none is defined.
442 public FeatureSettingsModelI getFeatureColourScheme(String source)
445 * return the first non-null colour scheme for any proxy for
446 * this database source
448 for (DbSourceProxy proxy : getSourceProxy(source))
450 FeatureSettingsModelI preferredColours = proxy
451 .getFeatureColourScheme();
452 if (preferredColours != null)
454 return preferredColours;