X-Git-Url: http://source.jalview.org/gitweb/?a=blobdiff_plain;f=src%2Fjalview%2Fext%2Fensembl%2FEnsemblFeatures.java;h=99ebc69a0349fa2d2ba1bfe8cc2423ca6fccc69b;hb=dadeab44d8d46ef588e326efb69599baa86a083b;hp=582eac6c2f8c66ccf0ef11e42d13095aee28f288;hpb=f59dd9efbb3dfc313ab0b0507832e21cd0076fe1;p=jalview.git diff --git a/src/jalview/ext/ensembl/EnsemblFeatures.java b/src/jalview/ext/ensembl/EnsemblFeatures.java index 582eac6..99ebc69 100644 --- a/src/jalview/ext/ensembl/EnsemblFeatures.java +++ b/src/jalview/ext/ensembl/EnsemblFeatures.java @@ -22,17 +22,25 @@ package jalview.ext.ensembl; import jalview.datamodel.Alignment; import jalview.datamodel.AlignmentI; -import jalview.io.DataSourceType; -import jalview.io.FeaturesFile; -import jalview.io.FileParse; +import jalview.datamodel.Sequence; +import jalview.datamodel.SequenceFeature; +import jalview.datamodel.SequenceI; +import jalview.io.gff.SequenceOntologyI; +import jalview.util.JSONUtils; import java.io.BufferedReader; import java.io.IOException; import java.net.MalformedURLException; import java.net.URL; import java.util.ArrayList; +import java.util.Iterator; import java.util.List; +import org.json.simple.JSONArray; +import org.json.simple.JSONObject; +import org.json.simple.parser.JSONParser; +import org.json.simple.parser.ParseException; + /** * A client for fetching and processing Ensembl feature data in GFF format by * calling the overlap REST service @@ -91,9 +99,133 @@ class EnsemblFeatures extends EnsemblRestClient { return null; } - FeaturesFile fr = new FeaturesFile( - new FileParse(fp, null, DataSourceType.URL)); - return new Alignment(fr.getSeqsAsArray()); + + SequenceI seq = parseFeaturesJson(fp); + return new Alignment(new SequenceI[] { seq }); + } + + /** + * Parses the JSON response into Jalview sequence features and attaches them + * to a dummy sequence + * + * @param br + * @return + */ + private SequenceI parseFeaturesJson(BufferedReader br) + { + SequenceI seq = new Sequence("Dummy", ""); + + JSONParser jp = new JSONParser(); + try + { + JSONArray responses = (JSONArray) jp.parse(br); + Iterator rvals = responses.iterator(); + while (rvals.hasNext()) + { + try + { + JSONObject obj = (JSONObject) rvals.next(); + String type = obj.get("feature_type").toString(); + int start = Integer.parseInt(obj.get("start").toString()); + int end = Integer.parseInt(obj.get("end").toString()); + String source = obj.get("source").toString(); + String strand = obj.get("strand").toString(); + Object phase = obj.get("phase"); + String alleles = JSONUtils + .arrayToList((JSONArray) obj.get("alleles")); + String clinSig = JSONUtils + .arrayToList( + (JSONArray) obj.get("clinical_significance")); + + /* + * convert 'variation' to 'sequence_variant', and 'cds' to 'CDS' + * so as to have a valid SO term for the feature type + * ('gene', 'exon', 'transcript' don't need any conversion) + */ + if ("variation".equals(type)) + { + type = SequenceOntologyI.SEQUENCE_VARIANT; + } + else if (SequenceOntologyI.CDS.equalsIgnoreCase((type))) + { + type = SequenceOntologyI.CDS; + } + + String desc = getFirstNotNull(obj, "alleles", "external_name", + JSON_ID); + SequenceFeature sf = new SequenceFeature(type, desc, start, end, + source); + sf.setStrand("1".equals(strand) ? "+" : "-"); + if (phase != null) + { + sf.setPhase(phase.toString()); + } + setFeatureAttribute(sf, obj, "id"); + setFeatureAttribute(sf, obj, "Parent"); + setFeatureAttribute(sf, obj, "consequence_type"); + sf.setValue("alleles", alleles); + sf.setValue("clinical_significance", clinSig); + + seq.addSequenceFeature(sf); + } catch (Throwable t) + { + // ignore - keep trying other features + } + } + } catch (ParseException | IOException e) + { + // ignore + } + + return seq; + } + + /** + * Returns the first non-null attribute found (if any) as a string, formatted + * suitably for display as feature description or tooltip. Answers null if + * none of the attribute keys is present. + * + * @param obj + * @param keys + * @return + */ + protected String getFirstNotNull(JSONObject obj, String... keys) + { + String desc = null; + + for (String key : keys) + { + Object val = obj.get(key); + if (val != null) + { + String s = val instanceof JSONArray + ? JSONUtils.arrayToList((JSONArray) val) + : val.toString(); + if (!s.isEmpty()) + { + return s; + } + } + } + return desc; + } + + /** + * A helper method that reads the 'key' entry in the JSON object, and if not + * null, sets its string value as an attribute on the sequence feature + * + * @param sf + * @param obj + * @param key + */ + protected void setFeatureAttribute(SequenceFeature sf, JSONObject obj, + String key) + { + Object object = obj.get(key); + if (object != null) + { + sf.setValue(key, object.toString()); + } } /** @@ -109,7 +241,7 @@ class EnsemblFeatures extends EnsemblRestClient urlstring.append(getDomain()).append("/overlap/id/").append(ids.get(0)); // @see https://github.com/Ensembl/ensembl-rest/wiki/Output-formats - urlstring.append("?content-type=text/x-gff3"); + urlstring.append("?content-type=" + getResponseMimeType()); /* * specify object_type=gene in case is shared by transcript and/or protein; @@ -145,16 +277,16 @@ class EnsemblFeatures extends EnsemblRestClient @Override protected String getRequestMimeType() { - return "text/x-gff3"; + return "application/json"; } /** - * Returns the MIME type for GFF3 + * Returns the MIME type wanted for the response */ @Override protected String getResponseMimeType() { - return "text/x-gff3"; + return "application/json"; } /**