import java.net.MalformedURLException;
import java.net.URL;
import java.util.ArrayList;
+import java.util.Collections;
import java.util.Iterator;
import java.util.List;
*/
public class EnsemblSymbol extends EnsemblXref
{
+ private static final String COLON = ":";
+ private static final String GENE = "gene";
+ private static final String TYPE = "type";
+ private static final String ID = "id";
+
/**
* Constructor given the target domain to fetch data from
*
while (rvals.hasNext())
{
JSONObject val = (JSONObject) rvals.next();
- String id = val.get("id").toString();
- String type = val.get("type").toString();
- if (id != null && "gene".equals(type))
+ String id = val.get(ID).toString();
+ String type = val.get(TYPE).toString();
+ if (id != null && GENE.equals(type))
{
result = id;
break;
* translation)
* @return
*/
- protected URL getUrl(String id, Species species, String... type)
+ protected URL getUrl(String id, String species, String... type)
{
StringBuilder sb = new StringBuilder();
- sb.append(getDomain()).append("/xrefs/symbol/")
- .append(species.toString()).append("/").append(id)
- .append("?content-type=application/json");
+ sb.append(getDomain()).append("/xrefs/symbol/").append(species)
+ .append("/").append(id).append(CONTENT_TYPE_JSON);
for (String t : type)
{
sb.append("&object_type=").append(t);
}
/**
- * Calls the Ensembl xrefs REST 'symbol' endpoint and retrieves any gene ids
- * for the given identifier, for any known model organisms
+ * Calls the Ensembl xrefs REST 'symbol' endpoint and retrieves gene id(s) for
+ * the given identifier. If the identifier has the format species:symbol then
+ * the gene id for the specified species is returned, else any matched gene ids
+ * for model organisms. If lookup fails, the returned list is empty.
*
* @param identifier
* @return
*/
public List<String> getGeneIds(String identifier)
{
- List<String> result = new ArrayList<String>();
- List<String> ids = new ArrayList<String>();
- ids.add(identifier);
+ List<String> result = new ArrayList<>();
+ List<String> ids = Collections.<String> emptyList();
+ List<String> species = getSpecies(identifier);
- String[] queries = identifier.split(getAccessionSeparator());
+ String symbol = identifier.substring(identifier.indexOf(COLON) + 1);
BufferedReader br = null;
try
{
- for (String query : queries)
- {
- for (Species taxon : Species.values())
+ for (String taxon : species)
{
- if (taxon.isModelOrganism())
+ URL url = getUrl(symbol, taxon, GENE);
+ if (url != null)
{
- URL url = getUrl(query, taxon, "gene");
- if (url != null)
+ br = getHttpResponse(url, ids);
+ if (br != null)
{
- br = getHttpResponse(url, ids);
- if (br != null)
+ String geneId = parseSymbolResponse(br);
+ if (geneId != null && !result.contains(geneId))
{
- String geneId = parseSymbolResponse(br);
- if (geneId != null && !result.contains(geneId))
- {
- result.add(geneId);
- }
+ result.add(geneId);
}
}
}
}
- }
} catch (IOException e)
{
// ignore
return result;
}
+ /**
+ * Answers a list of species names which is
+ * <ul>
+ * <li>the species in the identifier if it is of the form species:symbol</li>
+ * <li>else a fixed list of 'model organism' species</li>
+ * </ul>
+ *
+ * @param identifier
+ * @return
+ */
+ private List<String> getSpecies(String identifier)
+ {
+ int pos = identifier.indexOf(COLON);
+ if (pos > 0)
+ {
+ return Collections.singletonList(identifier.substring(0, pos));
+ }
+ else
+ {
+ return Species.getModelOrganisms();
+ }
+ }
+
}