2 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
3 * Copyright (C) $$Year-Rel$$ The Jalview Authors
5 * This file is part of Jalview.
7 * Jalview is free software: you can redistribute it and/or
8 * modify it under the terms of the GNU General Public License
9 * as published by the Free Software Foundation, either version 3
10 * of the License, or (at your option) any later version.
12 * Jalview is distributed in the hope that it will be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty
14 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
15 * PURPOSE. See the GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
19 * The Jalview Authors are detailed in the 'AUTHORS' file.
21 package jalview.ext.ensembl;
23 import jalview.datamodel.AlignmentI;
25 import java.io.BufferedReader;
26 import java.io.IOException;
27 import java.net.MalformedURLException;
29 import java.util.Arrays;
30 import java.util.List;
32 import org.json.simple.JSONObject;
33 import org.json.simple.parser.JSONParser;
34 import org.json.simple.parser.ParseException;
37 * A client for the Ensembl lookup REST endpoint, used to find the gene
38 * identifier given a gene, transcript or protein identifier.
42 public class EnsemblLookup extends EnsemblRestClient
45 * Default constructor (to use rest.ensembl.org)
47 public EnsemblLookup()
53 * Constructor given the target domain to fetch data from
57 public EnsemblLookup(String d)
63 public String getDbName()
69 public AlignmentI getSequenceRecords(String queries) throws Exception
75 protected URL getUrl(List<String> ids) throws MalformedURLException
77 String identifier = ids.get(0);
78 return getUrl(identifier, null);
82 * Gets the url for lookup of the given identifier, optionally with objectType
83 * also specified in the request
89 protected URL getUrl(String identifier, String objectType)
91 String url = getDomain() + "/lookup/id/" + identifier
93 if (objectType != null)
95 url += "&" + OBJECT_TYPE + "=" + objectType;
101 } catch (MalformedURLException e)
108 protected boolean useGetRequest()
114 protected String getRequestMimeType(boolean multipleIds)
116 return "application/json";
120 protected String getResponseMimeType()
122 return "application/json";
126 * Returns the gene id related to the given identifier, which may be for a
127 * gene, transcript or protein
132 public String getGeneId(String identifier)
134 return getGeneId(identifier, null);
138 * Returns the gene id related to the given identifier (which may be for a
139 * gene, transcript or protein)
145 public String getGeneId(String identifier, String objectType)
147 List<String> ids = Arrays.asList(new String[] { identifier });
149 BufferedReader br = null;
152 URL url = getUrl(identifier, objectType);
155 br = getHttpResponse(url, ids);
157 return br == null ? null : parseResponse(br);
158 } catch (IOException e)
169 } catch (IOException e)
178 * Parses the JSON response and returns the gene identifier, or null if not
179 * found. If the returned object_type is Gene, returns the id, if Transcript
180 * returns the Parent. If it is Translation (peptide identifier), then the
181 * Parent is the transcript identifier, so we redo the search with this value.
185 * @throws IOException
187 protected String parseResponse(BufferedReader br) throws IOException
189 String geneId = null;
190 JSONParser jp = new JSONParser();
193 JSONObject val = (JSONObject) jp.parse(br);
194 String type = val.get(OBJECT_TYPE).toString();
195 if (OBJECT_TYPE_GENE.equalsIgnoreCase(type))
197 // got the gene - just returns its id
198 geneId = val.get(ID).toString();
200 else if (OBJECT_TYPE_TRANSCRIPT.equalsIgnoreCase(type))
202 // got the transcript - return its (Gene) Parent
203 geneId = val.get(PARENT).toString();
205 else if (OBJECT_TYPE_TRANSLATION.equalsIgnoreCase(type))
207 // got the protein - get its Parent, restricted to type Transcript
208 String transcriptId = val.get(PARENT).toString();
209 geneId = getGeneId(transcriptId, OBJECT_TYPE_TRANSCRIPT);
211 } catch (ParseException e)