import java.net.MalformedURLException;
import java.net.URL;
import java.util.ArrayList;
+import java.util.Collections;
import java.util.Iterator;
import java.util.List;
*/
public class EnsemblSymbol extends EnsemblXref
{
+ private static final String COLON = ":";
private static final String GENE = "gene";
private static final String TYPE = "type";
private static final String ID = "id";
* translation)
* @return
*/
- protected URL getUrl(String id, Species species, String... type)
+ protected URL getUrl(String id, String species, String... type)
{
StringBuilder sb = new StringBuilder();
- sb.append(getDomain()).append("/xrefs/symbol/")
- .append(species.toString()).append("/").append(id)
- .append(CONTENT_TYPE_JSON);
+ sb.append(getDomain()).append("/xrefs/symbol/").append(species)
+ .append("/").append(id).append(CONTENT_TYPE_JSON);
for (String t : type)
{
sb.append("&object_type=").append(t);
}
/**
- * Calls the Ensembl xrefs REST 'symbol' endpoint and retrieves any gene ids
- * for the given identifier, for any known model organisms
+ * Calls the Ensembl xrefs REST 'symbol' endpoint and retrieves gene id(s) for
+ * the given identifier. If the identifier has the format species:symbol then
+ * the gene id for the specified species is returned, else any matched gene ids
+ * for model organisms. If lookup fails, the returned list is empty.
*
* @param identifier
* @return
*/
public List<String> getGeneIds(String identifier)
{
- List<String> result = new ArrayList<String>();
- List<String> ids = new ArrayList<String>();
- ids.add(identifier);
+ List<String> result = new ArrayList<>();
+ List<String> ids = Collections.<String> emptyList();
+ List<String> species = getSpecies(identifier);
- String[] queries = identifier.split(getAccessionSeparator());
+ String symbol = identifier.substring(identifier.indexOf(COLON) + 1);
BufferedReader br = null;
try
{
- for (String query : queries)
- {
- for (Species taxon : Species.getModelOrganisms())
+ for (String taxon : species)
{
- URL url = getUrl(query, taxon, GENE);
+ URL url = getUrl(symbol, taxon, GENE);
if (url != null)
{
br = getHttpResponse(url, ids);
if (br != null)
{
String geneId = parseSymbolResponse(br);
- System.out.println(url + " returned " + geneId);
if (geneId != null && !result.contains(geneId))
{
result.add(geneId);
}
}
}
- }
} catch (IOException e)
{
// ignore
return result;
}
+ /**
+ * Answers a list of species names which is
+ * <ul>
+ * <li>the species in the identifier if it is of the form species:symbol</li>
+ * <li>else a fixed list of 'model organism' species</li>
+ * </ul>
+ *
+ * @param identifier
+ * @return
+ */
+ private List<String> getSpecies(String identifier)
+ {
+ int pos = identifier.indexOf(COLON);
+ if (pos > 0)
+ {
+ return Collections.singletonList(identifier.substring(0, pos));
+ }
+ else
+ {
+ return Species.getModelOrganisms();
+ }
+ }
+
}