2 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
3 * Copyright (C) $$Year-Rel$$ The Jalview Authors
5 * This file is part of Jalview.
7 * Jalview is free software: you can redistribute it and/or
8 * modify it under the terms of the GNU General Public License
9 * as published by the Free Software Foundation, either version 3
10 * of the License, or (at your option) any later version.
12 * Jalview is distributed in the hope that it will be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty
14 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
15 * PURPOSE. See the GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
19 * The Jalview Authors are detailed in the 'AUTHORS' file.
21 package jalview.ws.dbsources;
23 import jalview.util.MessageManager;
24 import jalview.ws.uimodel.PDBRestRequest;
25 import jalview.ws.uimodel.PDBRestResponse;
26 import jalview.ws.uimodel.PDBRestResponse.PDBResponseSummary;
28 import java.util.ArrayList;
29 import java.util.Collection;
30 import java.util.Iterator;
31 import java.util.List;
33 import javax.ws.rs.core.MediaType;
35 import org.json.simple.JSONArray;
36 import org.json.simple.JSONObject;
37 import org.json.simple.parser.JSONParser;
38 import org.json.simple.parser.ParseException;
40 import com.sun.jersey.api.client.Client;
41 import com.sun.jersey.api.client.ClientResponse;
42 import com.sun.jersey.api.client.WebResource;
43 import com.sun.jersey.api.client.config.ClientConfig;
44 import com.sun.jersey.api.client.config.DefaultClientConfig;
47 * A rest client for querying the Search endpoint of the PDB REST API
52 public class PDBRestClient
54 public static final String PDB_SEARCH_ENDPOINT = "http://www.ebi.ac.uk/pdbe/search/pdb/select?";
56 private static int DEFAULT_RESPONSE_SIZE = 200;
59 * Takes a PDBRestRequest object and returns a response upon execution
61 * @param pdbRestRequest
62 * the PDBRestRequest instance to be processed
63 * @return the pdbResponse object for the given request
66 public PDBRestResponse executeRequest(PDBRestRequest pdbRestRequest)
71 ClientConfig clientConfig = new DefaultClientConfig();
72 Client client = Client.create(clientConfig);
74 String wantedFields = getPDBDocFieldsAsCommaDelimitedString(pdbRestRequest
76 int responseSize = (pdbRestRequest.getResponseSize() == 0) ? DEFAULT_RESPONSE_SIZE
77 : pdbRestRequest.getResponseSize();
78 String sortParam = null;
79 if (pdbRestRequest.getFieldToSortBy() == null
80 || pdbRestRequest.getFieldToSortBy().trim().isEmpty())
86 if (pdbRestRequest.getFieldToSortBy()
87 .equalsIgnoreCase("Resolution"))
89 sortParam = pdbRestRequest.getFieldToSortBy()
90 + (pdbRestRequest.isAscending() ? " asc" : " desc");
94 sortParam = pdbRestRequest.getFieldToSortBy()
95 + (pdbRestRequest.isAscending() ? " desc" : " asc");
99 String facetPivot = (pdbRestRequest.getFacetPivot() == null || pdbRestRequest
100 .getFacetPivot().isEmpty()) ? "" : pdbRestRequest
102 String facetPivotMinCount = String.valueOf(pdbRestRequest
103 .getFacetPivotMinCount());
105 // Build request parameters for the REST Request
106 WebResource webResource = null;
107 if (pdbRestRequest.isFacet())
109 webResource = client.resource(PDB_SEARCH_ENDPOINT)
110 .queryParam("wt", "json").queryParam("fl", wantedFields)
111 .queryParam("rows", String.valueOf(responseSize))
112 .queryParam("q", pdbRestRequest.getQuery())
113 .queryParam("sort", sortParam).queryParam("facet", "true")
114 .queryParam("facet.pivot", facetPivot)
115 .queryParam("facet.pivot.mincount", facetPivotMinCount);
119 webResource = client.resource(PDB_SEARCH_ENDPOINT)
120 .queryParam("wt", "json").queryParam("fl", wantedFields)
121 .queryParam("rows", String.valueOf(responseSize))
122 .queryParam("q", pdbRestRequest.getQuery())
123 .queryParam("sort", sortParam);
125 // Execute the REST request
126 ClientResponse clientResponse = webResource.accept(
127 MediaType.APPLICATION_JSON).get(ClientResponse.class);
129 // Get the JSON string from the response object
130 String responseString = clientResponse.getEntity(String.class);
131 // System.out.println("query >>>>>>> " + pdbRestRequest.toString());
133 // Check the response status and report exception if one occurs
134 if (clientResponse.getStatus() != 200)
136 String errorMessage = "";
137 if (clientResponse.getStatus() == 400)
139 errorMessage = parseJsonExceptionString(responseString);
140 throw new Exception(errorMessage);
144 errorMessage = getMessageByHTTPStatusCode(clientResponse
146 throw new Exception(errorMessage);
150 // Make redundant objects eligible for garbage collection to conserve
152 clientResponse = null;
155 // Process the response and return the result to the caller.
156 return parsePDBJsonResponse(responseString, pdbRestRequest);
157 } catch (Exception e)
159 String exceptionMsg = e.getMessage();
160 if (exceptionMsg.contains("SocketException"))
162 // No internet connection
165 .getString("exception.unable_to_detect_internet_connection"));
167 else if (exceptionMsg.contains("UnknownHostException"))
169 // The server 'www.ebi.ac.uk' is unreachable
172 .getString("exception.pdb_server_unreachable"));
181 public String getMessageByHTTPStatusCode(int code)
187 message = MessageManager
188 .getString("exception.pdb_rest_service_no_longer_available");
192 message = MessageManager.getString("exception.resource_not_be_found");
202 message = MessageManager.getString("exception.pdb_server_error");
212 * Process error response from PDB server if/when one occurs.
214 * @param jsonResponse
215 * the JSON string containing error message from the server
216 * @return the processed error message from the JSON string
218 public static String parseJsonExceptionString(String jsonErrorResponse)
220 StringBuilder errorMessage = new StringBuilder(
221 "\n============= PDB Rest Client RunTime error =============\n");
225 JSONParser jsonParser = new JSONParser();
226 JSONObject jsonObj = (JSONObject) jsonParser.parse(jsonErrorResponse);
227 JSONObject errorResponse = (JSONObject) jsonObj.get("error");
229 JSONObject responseHeader = (JSONObject) jsonObj
230 .get("responseHeader");
231 JSONObject paramsObj = (JSONObject) responseHeader.get("params");
232 String status = responseHeader.get("status").toString();
233 String message = errorResponse.get("msg").toString();
234 String query = paramsObj.get("q").toString();
235 String fl = paramsObj.get("fl").toString();
237 errorMessage.append("Status: ").append(status).append("\n");
238 errorMessage.append("Message: ").append(message).append("\n");
239 errorMessage.append("query: ").append(query).append("\n");
240 errorMessage.append("fl: ").append(fl).append("\n");
242 } catch (ParseException e)
246 return errorMessage.toString();
250 * Parses the JSON response string from PDB REST API. The response is dynamic
251 * hence, only fields specifically requested for in the 'wantedFields'
252 * parameter is fetched/processed
254 * @param pdbJsonResponseString
255 * the JSON string to be parsed
256 * @param pdbRestRequest
257 * the request object which contains parameters used to process the
261 @SuppressWarnings("unchecked")
262 public static PDBRestResponse parsePDBJsonResponse(
263 String pdbJsonResponseString, PDBRestRequest pdbRestRequest)
265 PDBRestResponse searchResult = new PDBRestResponse();
266 List<PDBResponseSummary> result = null;
269 JSONParser jsonParser = new JSONParser();
270 JSONObject jsonObj = (JSONObject) jsonParser
271 .parse(pdbJsonResponseString);
273 JSONObject pdbResponse = (JSONObject) jsonObj.get("response");
274 String queryTime = ((JSONObject) jsonObj.get("responseHeader")).get(
276 int numFound = Integer
277 .valueOf(pdbResponse.get("numFound").toString());
280 result = new ArrayList<PDBResponseSummary>();
281 JSONArray docs = (JSONArray) pdbResponse.get("docs");
282 for (Iterator<JSONObject> docIter = docs.iterator(); docIter
285 JSONObject doc = docIter.next();
286 result.add(searchResult.new PDBResponseSummary(doc,
289 searchResult.setNumberOfItemsFound(numFound);
290 searchResult.setResponseTime(queryTime);
291 searchResult.setSearchSummary(result);
293 } catch (ParseException e)
301 * Takes a collection of PDBDocField and converts its 'code' Field values into
302 * a comma delimited string.
304 * @param pdbDocfields
305 * the collection of PDBDocField to process
306 * @return the comma delimited string from the pdbDocFields collection
308 public static String getPDBDocFieldsAsCommaDelimitedString(
309 Collection<PDBDocField> pdbDocfields)
312 if (pdbDocfields != null && !pdbDocfields.isEmpty())
314 StringBuilder returnedFields = new StringBuilder();
315 for (PDBDocField field : pdbDocfields)
317 returnedFields.append(",").append(field.getCode());
319 returnedFields.deleteCharAt(0);
320 result = returnedFields.toString();
326 * Determines the column index for 'PDB Id' Fields in the dynamic summary
327 * table. The PDB Id serves as a unique identifier for a given row in the
330 * @param wantedFields
331 * the available table columns in no particular order
332 * @return the pdb id field column index
334 public static int getPDBIdColumIndex(
335 Collection<PDBDocField> wantedFields, boolean hasRefSeq)
338 // If a reference sequence is attached then start counting from 1 else
340 int pdbFieldIndexCounter = hasRefSeq ? 1 : 0;
342 for (PDBDocField field : wantedFields)
344 if (field.equals(PDBDocField.PDB_ID))
346 break; // Once PDB Id index is determined exit iteration
348 ++pdbFieldIndexCounter;
350 return pdbFieldIndexCounter;
353 public static PDBDocField getPDBDocFieldByCode(String fieldCode)
356 for (PDBDocField curPDBDocField : PDBDocField.values())
358 if (curPDBDocField.getCode().equalsIgnoreCase(fieldCode))
360 return curPDBDocField;
363 throw new Exception("PDB doc Field not found!");
367 * This enum represents the fields available in the PDB JSON response
370 public enum PDBDocField
372 PDB_ID("PDB Id", "pdb_id"), TITLE("Title", "title"), MOLECULE_NAME(
373 "Molecule", "molecule_name"), MOLECULE_TYPE("Molecule Type",
374 "molecule_type"), MOLECULE_SEQUENCE("Sequence",
375 "molecule_sequence"), PFAM_ACCESSION("PFAM Accession",
376 "pfam_accession"), PFAM_NAME("PFAM Name", "pfam_name"), INTERPRO_NAME(
377 "InterPro Name", "interpro_name"), INTERPRO_ACCESSION(
378 "InterPro Accession", "interpro_accession"), UNIPROT_ID(
379 "UniProt Id", "uniprot_id"), UNIPROT_ACCESSION(
380 "UniProt Accession", "uniprot_accession"), UNIPROT_COVERAGE(
381 "UniProt Coverage", "uniprot_coverage"), UNIPROT_FEATURES(
382 "Uniprot Features", "uniprot_features"), R_FACTOR("R Factor",
383 "r_factor"), RESOLUTION("Resolution", "resolution"), DATA_QUALITY(
384 "Data Quality", "data_quality"), OVERALL_QUALITY(
385 "Overall Quality", "overall_quality"), POLYMER_COUNT(
386 "Number of Polymers", "number_of_polymers"), PROTEIN_CHAIN_COUNT(
387 "Number of Protein Chains", "number_of_protein_chains"), BOUND_MOLECULE_COUNT(
388 "Number of Bound Molecule", "number_of_bound_molecules"), POLYMER_RESIDUE_COUNT(
389 "Number of Polymer Residue", "number_of_polymer_residues"), GENUS(
390 "GENUS", "genus"), GENE_NAME("Gene Name", "gene_name"), EXPERIMENTAL_METHOD(
391 "Experimental Method", "experimental_method"), GO_ID("GO Id",
392 "go_id"), ASSEMBLY_ID("Assembly Id", "assembly_form"), ASSEMBLY_FORM(
393 "Assembly Form", "assembly_id"), ASSEMBLY_TYPE("Assembly Type",
394 "assembly_type"), SPACE_GROUP("Space Group", "spacegroup"), CATH_CODE(
395 "Cath Code", "cath_code"), TAX_ID("Tax Id", "tax_id"), TAX_QUERY(
396 "Tax Query", "tax_query"), INTERACTING_ENTRY_ID(
397 "Interacting Entry Id", "interacting_entry_id"), INTERACTING_ENTITY_ID(
398 "Interacting Entity Id", "interacting_entity_id"), INTERACTING_MOLECULES(
399 "Interacting Molecules", "interacting_molecules"), PUBMED_ID(
400 "Pubmed Id", "pubmed_id"), STATUS("Status", "status"), MODEL_QUALITY(
401 "Model Quality", "model_quality"), PIVOT_RESOLUTION(
402 "Pivot Resolution", "pivot_resolution"), DATA_REDUCTION_SOFTWARE(
403 "Data reduction software", "data_reduction_software"), MAX_OBSERVED_RES(
404 "Max observed residues", "max_observed_residues"), ORG_SCI_NAME(
405 "Organism scientific name", "organism_scientific_name"), SUPER_KINGDOM(
406 "Super kingdom", "superkingdom"), RANK("Rank", "rank"), CRYSTALLISATION_PH(
407 "Crystallisation Ph", "crystallisation_ph"), BIOLOGICAL_FUNCTION(
408 "Biological Function", "biological_function"), BIOLOGICAL_PROCESS(
409 "Biological Process", "biological_process"), BIOLOGICAL_CELL_COMPONENT(
410 "Biological Cell Component", "biological_cell_component"), COMPOUND_NAME(
411 "Compound Name", "compound_name"), COMPOUND_ID("Compound Id",
412 "compound_id"), COMPOUND_WEIGHT("Compound Weight",
413 "compound_weight"), COMPOUND_SYSTEMATIC_NAME(
414 "Compound Systematic Name", "compound_systematic_name"), INTERACTING_LIG(
415 "Interacting Ligands", "interacting_ligands"), JOURNAL(
416 "Journal", "journal"), ALL_AUTHORS("All Authors", "all_authors"), EXPERIMENTAL_DATA_AVAILABLE(
417 "Experiment Data Available", "experiment_data_available"), DIFFRACTION_PROTOCOL(
418 "Diffraction Protocol", "diffraction_protocol"), REFINEMENT_SOFTWARE(
419 "Refinement Software", "refinement_software"), STRUCTURE_DETERMINATION_METHOD(
420 "Structure Determination Method",
421 "structure_determination_method"), SYNCHROTON_SITE(
422 "Synchrotron Site", "synchrotron_site"), SAMPLE_PREP_METHOD(
423 "Sample Preparation Method", "sample_preparation_method"), ENTRY_AUTHORS(
424 "Entry Authors", "entry_authors"), CITATION_TITLE(
425 "Citation Title", "citation_title"), STRUCTURE_SOLUTION_SOFTWARE(
426 "Structure Solution Software", "structure_solution_software"), ENTRY_ENTITY(
427 "Entry Entity", "entry_entity"), R_FREE("R Free", "r_free"), NO_OF_POLYMER_ENTITIES(
428 "Number of Polymer Entities", "number_of_polymer_entities"), NO_OF_BOUND_ENTITIES(
429 "Number of Bound Entities", "number_of_bound_entities"), CRYSTALLISATION_RESERVOIR(
430 "Crystallisation Reservoir", "crystallisation_reservoir"), DATA_SCALING_SW(
431 "Data Scalling Software", "data_scaling_software"), DETECTOR(
432 "Detector", "detector"), DETECTOR_TYPE("Detector Type",
433 "detector_type"), MODIFIED_RESIDUE_FLAG(
434 "Modified Residue Flag", "modified_residue_flag"), NUMBER_OF_COPIES(
435 "Number of Copies", "number_of_copies"), STRUCT_ASYM_ID(
436 "Struc Asym Id", "struct_asym_id"), HOMOLOGUS_PDB_ENTITY_ID(
437 "Homologus PDB Entity Id", "homologus_pdb_entity_id"), MOLECULE_SYNONYM(
438 "Molecule Synonym", "molecule_synonym"), DEPOSITION_SITE(
439 "Deposition Site", "deposition_site"), SYNCHROTRON_BEAMLINE(
440 "Synchrotron Beamline", "synchrotron_beamline"), ENTITY_ID(
441 "Entity Id", "entity_id"), BEAM_SOURCE_NAME("Beam Source Name",
442 "beam_source_name"), PROCESSING_SITE("Processing Site",
443 "processing_site"), ENTITY_WEIGHT("Entity Weight",
444 "entity_weight"), VERSION("Version", "_version_"), ALL("ALL",
451 PDBDocField(String name, String code)
457 public String getName()
462 public String getCode()
468 public String toString()