2 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
3 * Copyright (C) $$Year-Rel$$ The Jalview Authors
5 * This file is part of Jalview.
7 * Jalview is free software: you can redistribute it and/or
8 * modify it under the terms of the GNU General Public License
9 * as published by the Free Software Foundation, either version 3
10 * of the License, or (at your option) any later version.
12 * Jalview is distributed in the hope that it will be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty
14 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
15 * PURPOSE. See the GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
19 * The Jalview Authors are detailed in the 'AUTHORS' file.
21 package jalview.ext.ensembl;
23 import jalview.bin.Console;
24 import jalview.datamodel.AlignmentI;
25 import jalview.datamodel.GeneLociI;
26 import jalview.datamodel.GeneLocus;
27 import jalview.datamodel.Mapping;
28 import jalview.util.MapList;
30 import java.io.IOException;
31 import java.net.MalformedURLException;
33 import java.util.Arrays;
34 import java.util.Collections;
35 import java.util.List;
38 import org.json.simple.parser.ParseException;
41 * A client for the Ensembl /lookup REST endpoint, used to find the gene
42 * identifier given a gene, transcript or protein identifier, or to extract the
43 * species or chromosomal coordinates from the same service response
47 public class EnsemblLookup extends EnsemblRestClient
49 private static final String SPECIES = "species";
52 * Default constructor (to use rest.ensembl.org)
54 public EnsemblLookup()
60 * Constructor given the target domain to fetch data from
64 public EnsemblLookup(String d)
70 public String getDbName()
76 public AlignmentI getSequenceRecords(String queries) throws Exception
82 protected URL getUrl(List<String> ids) throws MalformedURLException
84 String identifier = ids.get(0);
85 return getUrl(identifier, null);
89 * Gets the url for lookup of the given identifier, optionally with objectType
90 * also specified in the request
96 protected URL getUrl(String identifier, String objectType)
98 String url = getDomain() + "/lookup/id/" + identifier
100 if (objectType != null)
102 url += "&" + OBJECT_TYPE + "=" + objectType;
108 } catch (MalformedURLException e)
115 protected boolean useGetRequest()
121 * Returns the gene id related to the given identifier (which may be for a
122 * gene, transcript or protein), or null if none is found
127 public String getGeneId(String identifier)
129 return getGeneId(identifier, null);
133 * Returns the gene id related to the given identifier (which may be for a
134 * gene, transcript or protein), or null if none is found
140 public String getGeneId(String identifier, String objectType)
142 return parseGeneId(getResult(identifier, objectType));
146 * Parses the JSON response and returns the gene identifier, or null if not
147 * found. If the returned object_type is Gene, returns the id, if Transcript
148 * returns the Parent. If it is Translation (peptide identifier), then the
149 * Parent is the transcript identifier, so we redo the search with this value.
154 protected String parseGeneId(Map<String, Object> val)
160 String geneId = null;
161 String type = val.get(OBJECT_TYPE).toString();
162 if (OBJECT_TYPE_GENE.equalsIgnoreCase(type))
164 // got the gene - just returns its id
165 geneId = val.get(JSON_ID).toString();
167 else if (OBJECT_TYPE_TRANSCRIPT.equalsIgnoreCase(type))
169 // got the transcript - return its (Gene) Parent
170 geneId = val.get(PARENT).toString();
172 else if (OBJECT_TYPE_TRANSLATION.equalsIgnoreCase(type))
174 // got the protein - get its Parent, restricted to type Transcript
175 String transcriptId = val.get(PARENT).toString();
176 geneId = getGeneId(transcriptId, OBJECT_TYPE_TRANSCRIPT);
183 * Calls the Ensembl lookup REST endpoint and retrieves the 'species' for the
184 * given identifier, or null if not found
189 public String getSpecies(String identifier)
191 String species = null;
192 Map<String, Object> json = getResult(identifier, null);
195 Object o = json.get(SPECIES);
198 species = o.toString();
205 * Calls the /lookup/id rest service and returns the response as a
206 * {@code Map<String, Object>}, or null if any error
213 @SuppressWarnings("unchecked")
214 protected Map<String, Object> getResult(String identifier,
217 List<String> ids = Arrays.asList(new String[] { identifier });
221 return (Map<String, Object>) getJSON(getUrl(identifier, objectType),
222 ids, -1, MODE_MAP, null);
223 } catch (IOException | ParseException e)
225 jalview.bin.Console.errPrintln("Error parsing " + identifier + " lookup response "
232 * Calls the /lookup/id rest service for the given id, and if successful,
233 * parses and returns the gene's chromosomal coordinates
238 public GeneLociI getGeneLoci(String geneId)
240 return parseGeneLoci(getResult(geneId, OBJECT_TYPE_GENE));
244 * Parses the /lookup/id response for species, assembly_name,
245 * seq_region_name, start, end and returns an object that wraps them, or null
251 GeneLociI parseGeneLoci(Map<String, Object> json)
260 final String species = json.get("species").toString();
261 final String assembly = json.get("assembly_name").toString();
262 final String chromosome = json.get("seq_region_name").toString();
263 String strand = json.get("strand").toString();
264 int start = Integer.parseInt(json.get("start").toString());
265 int end = Integer.parseInt(json.get("end").toString());
266 int fromEnd = end - start + 1;
267 boolean reverseStrand = "-1".equals(strand);
268 int toStart = reverseStrand ? end : start;
269 int toEnd = reverseStrand ? start : end;
270 List<int[]> fromRange = Collections
271 .singletonList(new int[]
273 List<int[]> toRange = Collections
274 .singletonList(new int[]
276 final Mapping map = new Mapping(
277 new MapList(fromRange, toRange, 1, 1));
278 return new GeneLocus(species == null ? "" : species, assembly,
280 } catch (NullPointerException | NumberFormatException e)
282 Console.error("Error looking up gene loci: " + e.getMessage());