From dad8955628659a3478493cc5121311030df20426 Mon Sep 17 00:00:00 2001 From: Jim Procter Date: Sun, 2 Oct 2016 12:26:40 +0100 Subject: [PATCH] JAL-2210 remove ENSEMBL from protein DB list: 1. prevents transcript identifiers being promoted to primary refs on uniprot sequences. 2. obviates the need to add peptide product id to the uniprot sequence. --- src/jalview/datamodel/DBRefSource.java | 2 +- src/jalview/ws/dbsources/Uniprot.java | 22 ++++++++++++++++++++++ 2 files changed, 23 insertions(+), 1 deletion(-) diff --git a/src/jalview/datamodel/DBRefSource.java b/src/jalview/datamodel/DBRefSource.java index 0ac14e5..aef18e9 100755 --- a/src/jalview/datamodel/DBRefSource.java +++ b/src/jalview/datamodel/DBRefSource.java @@ -101,7 +101,7 @@ public class DBRefSource public static final String[] CODINGDBS = { EMBLCDS, GENEDB, ENSEMBL }; public static final String[] PROTEINDBS = { UNIPROT, UNIPROTKB, - EMBLCDSProduct, ENSEMBL }; // Ensembl ENSP* entries are protein + EMBLCDSProduct }; // , ENSEMBL }; // Ensembl ENSP* entries are protein public static String[] allSources() { diff --git a/src/jalview/ws/dbsources/Uniprot.java b/src/jalview/ws/dbsources/Uniprot.java index de70aab..7ecd324 100644 --- a/src/jalview/ws/dbsources/Uniprot.java +++ b/src/jalview/ws/dbsources/Uniprot.java @@ -236,6 +236,28 @@ public class Uniprot extends DbSourceProxyImpl dbRefs.add(dbr); } } + if (false) // "Ensembl".equals(pdb.getType())) + { + /*UniprotXML + * + * + * + * + * + */ + String cdsId = (String) pdb.getProperty() + .get("protein sequence ID"); + if (cdsId != null && cdsId.trim().length() > 0) + { + // Only add the product ID + dbRefs.remove(dbr); + dbr = new DBRefEntry(DBRefSource.ENSEMBL, DBRefSource.UNIPROT + + ":" + dbVersion, cdsId.trim()); + dbRefs.add(dbr); + + } + } + } sequence.setPDBId(onlyPdbEntries); -- 1.7.10.2