X-Git-Url: http://source.jalview.org/gitweb/?a=blobdiff_plain;f=src%2Fjalview%2Fext%2Fensembl%2FEnsemblSymbol.java;h=411a244f4c245a3fd0c2a908f0493a5e0cf5ae48;hb=916c073172d5e374f7375ec718420455472dfcb3;hp=7763f29cc93d560a03ece621b0c138d87a19a914;hpb=853624fb32058cccc544ae7d13af6ad4b0800b6c;p=jalview.git
diff --git a/src/jalview/ext/ensembl/EnsemblSymbol.java b/src/jalview/ext/ensembl/EnsemblSymbol.java
index 7763f29..411a244 100644
--- a/src/jalview/ext/ensembl/EnsemblSymbol.java
+++ b/src/jalview/ext/ensembl/EnsemblSymbol.java
@@ -1,3 +1,23 @@
+/*
+ * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
+ * Copyright (C) $$Year-Rel$$ The Jalview Authors
+ *
+ * This file is part of Jalview.
+ *
+ * Jalview is free software: you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation, either version 3
+ * of the License, or (at your option) any later version.
+ *
+ * Jalview is distributed in the hope that it will be useful, but
+ * WITHOUT ANY WARRANTY; without even the implied warranty
+ * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
+ * PURPOSE. See the GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with Jalview. If not, see .
+ * The Jalview Authors are detailed in the 'AUTHORS' file.
+ */
package jalview.ext.ensembl;
import java.io.BufferedReader;
@@ -5,6 +25,7 @@ import java.io.IOException;
import java.net.MalformedURLException;
import java.net.URL;
import java.util.ArrayList;
+import java.util.Collections;
import java.util.Iterator;
import java.util.List;
@@ -22,6 +43,11 @@ import org.json.simple.parser.ParseException;
*/
public class EnsemblSymbol extends EnsemblXref
{
+ private static final String COLON = ":";
+ private static final String GENE = "gene";
+ private static final String TYPE = "type";
+ private static final String ID = "id";
+
/**
* Constructor given the target domain to fetch data from
*
@@ -42,8 +68,7 @@ public class EnsemblSymbol extends EnsemblXref
* @return
* @throws IOException
*/
- protected String parseSymbolResponse(BufferedReader br)
- throws IOException
+ protected String parseSymbolResponse(BufferedReader br) throws IOException
{
JSONParser jp = new JSONParser();
String result = null;
@@ -54,8 +79,9 @@ public class EnsemblSymbol extends EnsemblXref
while (rvals.hasNext())
{
JSONObject val = (JSONObject) rvals.next();
- String id = val.get("id").toString();
- if (id != null && isGeneIdentifier(id))
+ String id = val.get(ID).toString();
+ String type = val.get(TYPE).toString();
+ if (id != null && GENE.equals(type))
{
result = id;
break;
@@ -68,12 +94,30 @@ public class EnsemblSymbol extends EnsemblXref
return result;
}
- protected URL getUrl(String id, Species species)
+ /**
+ * Constructs the URL for the REST symbol endpoint
+ *
+ * @param id
+ * the accession id (Ensembl or external)
+ * @param species
+ * a species name recognisable by Ensembl
+ * @param type
+ * an optional type to filter the response (gene, transcript,
+ * translation)
+ * @return
+ */
+ protected URL getUrl(String id, String species, String... type)
{
- String url = getDomain() + "/xrefs/symbol/" + species.toString() + "/"
- + id + "?content-type=application/json";
+ StringBuilder sb = new StringBuilder();
+ sb.append(getDomain()).append("/xrefs/symbol/").append(species)
+ .append("/").append(id).append(CONTENT_TYPE_JSON);
+ for (String t : type)
+ {
+ sb.append("&object_type=").append(t);
+ }
try
{
+ String url = sb.toString();
return new URL(url);
} catch (MalformedURLException e)
{
@@ -82,41 +126,40 @@ public class EnsemblSymbol extends EnsemblXref
}
/**
- * Calls the Ensembl xrefs REST 'symbol' endpoint and retrieves any gene ids
- * for the given identifier, for any known model organisms
+ * Calls the Ensembl xrefs REST 'symbol' endpoint and retrieves gene id(s) for
+ * the given identifier. If the identifier has the format species:symbol then
+ * the gene id for the specified species is returned, else any matched gene ids
+ * for model organisms. If lookup fails, the returned list is empty.
*
* @param identifier
* @return
*/
- public List getIds(String identifier)
+ public List getGeneIds(String identifier)
{
- List result = new ArrayList();
- List ids = new ArrayList();
- ids.add(identifier);
+ List result = new ArrayList<>();
+ List ids = Collections. emptyList();
+ List species = getSpecies(identifier);
- String[] queries = identifier.split(getAccessionSeparator());
+ String symbol = identifier.substring(identifier.indexOf(COLON) + 1);
BufferedReader br = null;
try
{
- for (String query : queries)
- {
- for (Species taxon : Species.values())
+ for (String taxon : species)
{
- if (taxon.isModelOrganism())
+ URL url = getUrl(symbol, taxon, GENE);
+ if (url != null)
{
- URL url = getUrl(query, taxon);
- if (url != null)
- {
- br = getHttpResponse(url, ids);
- }
- String geneId = parseSymbolResponse(br);
- if (geneId != null)
+ br = getHttpResponse(url, ids);
+ if (br != null)
{
- result.add(geneId);
+ String geneId = parseSymbolResponse(br);
+ if (geneId != null && !result.contains(geneId))
+ {
+ result.add(geneId);
+ }
}
}
}
- }
} catch (IOException e)
{
// ignore
@@ -136,4 +179,27 @@ public class EnsemblSymbol extends EnsemblXref
return result;
}
+ /**
+ * Answers a list of species names which is
+ *
+ * - the species in the identifier if it is of the form species:symbol
+ * - else a fixed list of 'model organism' species
+ *
+ *
+ * @param identifier
+ * @return
+ */
+ private List getSpecies(String identifier)
+ {
+ int pos = identifier.indexOf(COLON);
+ if (pos > 0)
+ {
+ return Collections.singletonList(identifier.substring(0, pos));
+ }
+ else
+ {
+ return Species.getModelOrganisms();
+ }
+ }
+
}