/* * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$) * Copyright (C) $$Year-Rel$$ The Jalview Authors * * This file is part of Jalview. * * Jalview is free software: you can redistribute it and/or * modify it under the terms of the GNU General Public License * as published by the Free Software Foundation, either version 3 * of the License, or (at your option) any later version. * * Jalview is distributed in the hope that it will be useful, but * WITHOUT ANY WARRANTY; without even the implied warranty * of MERCHANTABILITY or FITNESS FOR A PARTICULAR * PURPOSE. See the GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with Jalview. If not, see . * The Jalview Authors are detailed in the 'AUTHORS' file. */ package MCview; import jalview.analysis.AlignSeq; import jalview.datamodel.Alignment; import jalview.datamodel.AlignmentAnnotation; import jalview.datamodel.AlignmentI; import jalview.datamodel.PDBEntry; import jalview.datamodel.SequenceI; import jalview.io.AlignFile; import jalview.io.FileParse; import jalview.schemes.ColourSchemeI; import jalview.util.MessageManager; import java.awt.Color; import java.io.IOException; import java.lang.reflect.Constructor; import java.util.ArrayList; import java.util.Hashtable; import java.util.List; import java.util.Vector; public class PDBfile extends AlignFile { private static String CALC_ID_PREFIX = "JalviewPDB"; public Vector chains; public String id; /** * set to true to add derived sequence annotations (temp factor read from * file, or computed secondary structure) to the alignment */ private boolean visibleChainAnnotation = false; /* * Set true to predict secondary structure (using JMol for protein, Annotate3D * for RNA) */ private boolean predictSecondaryStructure = true; /* * Set true (with predictSecondaryStructure=true) to predict secondary * structure using an external service (currently Annotate3D for RNA only) */ private boolean externalSecondaryStructure = false; public PDBfile(boolean addAlignmentAnnotations, boolean predictSecondaryStructure, boolean externalSecStr) { super(); this.visibleChainAnnotation = addAlignmentAnnotations; this.predictSecondaryStructure = predictSecondaryStructure; this.externalSecondaryStructure = externalSecStr; } public PDBfile(boolean addAlignmentAnnotations, boolean predictSecondaryStructure, boolean externalSecStr, String file, String protocol) throws IOException { super(false, file, protocol); this.visibleChainAnnotation = addAlignmentAnnotations; this.predictSecondaryStructure = predictSecondaryStructure; this.externalSecondaryStructure = externalSecStr; doParse(); } public PDBfile(boolean addAlignmentAnnotations, boolean predictSecondaryStructure, boolean externalSecStr, FileParse source) throws IOException { super(false, source); this.visibleChainAnnotation = addAlignmentAnnotations; this.predictSecondaryStructure = predictSecondaryStructure; this.externalSecondaryStructure = externalSecStr; doParse(); } public String print() { return null; } public void parse() throws IOException { // TODO set the filename sensibly - try using data source name. id = safeName(getDataName()); chains = new Vector(); List rna = new ArrayList(); List prot = new ArrayList(); PDBChain tmpchain; String line = null; boolean modelFlag = false; boolean terFlag = false; String lastID = ""; int indexx = 0; String atomnam = null; try { while ((line = nextLine()) != null) { if (line.indexOf("HEADER") == 0) { if (line.length() > 62) { String tid; if (line.length() > 67) { tid = line.substring(62, 67).trim(); } else { tid = line.substring(62).trim(); } if (tid.length() > 0) { id = tid; } continue; } } // Were we to do anything with SEQRES - we start it here if (line.indexOf("SEQRES") == 0) { } if (line.indexOf("MODEL") == 0) { modelFlag = true; } if (line.indexOf("TER") == 0) { terFlag = true; } if (modelFlag && line.indexOf("ENDMDL") == 0) { break; } if (line.indexOf("ATOM") == 0 || (line.indexOf("HETATM") == 0 && !terFlag)) { terFlag = false; // Jalview is only interested in CA bonds???? atomnam = line.substring(12, 15).trim(); if (!atomnam.equals("CA") && !atomnam.equals("P")) { continue; } Atom tmpatom = new Atom(line); tmpchain = findChain(tmpatom.chain); if (tmpchain != null) { if (tmpatom.resNumIns.trim().equals(lastID)) { // phosphorylated protein - seen both CA and P.. continue; } tmpchain.atoms.addElement(tmpatom); } else { tmpchain = new PDBChain(id, tmpatom.chain); chains.addElement(tmpchain); tmpchain.atoms.addElement(tmpatom); } lastID = tmpatom.resNumIns.trim(); } index++; } makeResidueList(); makeCaBondList(); if (id == null) { id = inFile.getName(); } for (PDBChain chain : chains) { SequenceI chainseq = postProcessChain(chain); if (isRNA(chainseq)) { rna.add(chainseq); } else { prot.add(chainseq); } } if (predictSecondaryStructure) { predictSecondaryStructure(rna, prot); } } catch (OutOfMemoryError er) { System.out.println("OUT OF MEMORY LOADING PDB FILE"); throw new IOException( MessageManager .getString("exception.outofmemory_loading_pdb_file")); } catch (NumberFormatException ex) { if (line != null) { System.err.println("Couldn't read number from line:"); System.err.println(line); } } markCalcIds(); } /** * Predict secondary structure for RNA and/or protein sequences and add as * annotations * * @param rnaSequences * @param proteinSequences */ protected void predictSecondaryStructure(List rnaSequences, List proteinSequences) { /* * Currently using Annotate3D for RNA, but only if the 'use external * prediction' flag is set */ if (externalSecondaryStructure && rnaSequences.size() > 0) { try { processPdbFileWithAnnotate3d(rnaSequences); } catch (Exception x) { System.err .println("Exceptions when dealing with RNA in pdb file"); x.printStackTrace(); } } /* * Currently using JMol PDB parser for peptide */ if (proteinSequences.size() > 0) { try { processPdbFileWithJmol(proteinSequences); } catch (Exception x) { System.err .println("Exceptions from Jmol when processing data in pdb file"); x.printStackTrace(); } } } /** * Process a parsed chain to construct and return a Sequence, and add it to * the list of sequences parsed. * * @param chain * @return */ protected SequenceI postProcessChain(PDBChain chain) { SequenceI dataset = chain.sequence; dataset.setName(id + "|" + dataset.getName()); PDBEntry entry = new PDBEntry(); entry.setId(id); entry.setType(PDBEntry.Type.PDB); entry.setProperty(new Hashtable()); if (chain.id != null) { // entry.getProperty().put("CHAIN", chains.elementAt(i).id); entry.setChainCode(String.valueOf(chain.id)); } if (inFile != null) { entry.setFile(inFile.getAbsolutePath()); } else { // TODO: decide if we should dump the datasource to disk entry.setFile(getDataName()); } dataset.addPDBId(entry); // PDBChain objects maintain reference to dataset SequenceI chainseq = dataset.deriveSequence(); seqs.addElement(chainseq); AlignmentAnnotation[] chainannot = chainseq.getAnnotation(); if (chainannot != null && visibleChainAnnotation) { for (int ai = 0; ai < chainannot.length; ai++) { chainannot[ai].visible = visibleChainAnnotation; annotations.addElement(chainannot[ai]); } } return chainseq; } public static boolean isCalcIdHandled(String calcId) { return calcId != null && (CALC_ID_PREFIX.equals(calcId)); } public static boolean isCalcIdForFile(AlignmentAnnotation alan, String pdbFile) { return alan.getCalcId() != null && CALC_ID_PREFIX.equals(alan.getCalcId()) && pdbFile.equals(alan.getProperty("PDBID")); } public static String relocateCalcId(String calcId, Hashtable alreadyLoadedPDB) throws Exception { int s = CALC_ID_PREFIX.length(), end = calcId.indexOf(CALC_ID_PREFIX, s); String between = calcId.substring(s, end - 1); return CALC_ID_PREFIX + alreadyLoadedPDB.get(between) + ":" + calcId.substring(end); } private void markCalcIds() { for (SequenceI sq : seqs) { if (sq.getAnnotation() != null) { for (AlignmentAnnotation aa : sq.getAnnotation()) { String oldId = aa.getCalcId(); if (oldId == null) { oldId = ""; } aa.setCalcId(CALC_ID_PREFIX); aa.setProperty("PDBID", id); aa.setProperty("oldCalcId", oldId); } } } } private void processPdbFileWithJmol(List prot) throws Exception { try { Class cl = Class.forName("jalview.ext.jmol.PDBFileWithJmol"); if (cl != null) { final Constructor constructor = cl.getConstructor(new Class[] { FileParse.class }); final Object[] args = new Object[] { new FileParse(getDataName(), type) }; Object jmf = constructor.newInstance(args); AlignmentI al = new Alignment((SequenceI[]) cl.getMethod( "getSeqsAsArray", new Class[] {}).invoke(jmf)); cl.getMethod("addAnnotations", new Class[] { AlignmentI.class }).invoke(jmf, al); for (SequenceI sq : al.getSequences()) { if (sq.getDatasetSequence() != null) { sq.getDatasetSequence().getPDBId().clear(); } else { sq.getPDBId().clear(); } } replaceAndUpdateChains(prot, al, AlignSeq.PEP, false); } } catch (ClassNotFoundException q) { } } private void replaceAndUpdateChains(List prot, AlignmentI al, String pep, boolean b) { List> replaced = AlignSeq .replaceMatchingSeqsWith(seqs, annotations, prot, al, pep, false); for (PDBChain ch : chains) { int p = 0; for (SequenceI sq : (List) replaced.get(0)) { p++; if (sq == ch.sequence || sq.getDatasetSequence() == ch.sequence) { p = -p; break; } } if (p < 0) { p = -p - 1; // set shadow entry for chains ch.shadow = (SequenceI) replaced.get(1).get(p); ch.shadowMap = ((AlignSeq) replaced.get(2).get(p)) .getMappingFromS1(false); } } } private void processPdbFileWithAnnotate3d(List rna) throws Exception { // System.out.println("this is a PDB format and RNA sequence"); // note: we use reflection here so that the applet can compile and run // without the HTTPClient bits and pieces needed for accessing Annotate3D // web service try { Class cl = Class.forName("jalview.ws.jws1.Annotate3D"); if (cl != null) { // TODO: use the PDB ID of the structure if one is available, to save // bandwidth and avoid uploading the whole structure to the service Object annotate3d = cl.getConstructor(new Class[] {}).newInstance(new Object[] {}); AlignmentI al = ((AlignmentI) cl.getMethod("getRNAMLFor", new Class[] { FileParse.class }).invoke(annotate3d, new Object[] { new FileParse(getDataName(), type) })); for (SequenceI sq : al.getSequences()) { if (sq.getDatasetSequence() != null) { if (sq.getDatasetSequence().getPDBId() != null) { sq.getDatasetSequence().getPDBId().clear(); } } else { if (sq.getPDBId() != null) { sq.getPDBId().clear(); } } } replaceAndUpdateChains(rna, al, AlignSeq.DNA, false); } } catch (ClassNotFoundException x) { // ignore classnotfounds - occurs in applet } ; } /** * make a friendly ID string. * * @param dataName * @return truncated dataName to after last '/' */ private String safeName(String dataName) { int p = 0; while ((p = dataName.indexOf("/")) > -1 && p < dataName.length()) { dataName = dataName.substring(p + 1); } return dataName; } public void makeResidueList() { for (int i = 0; i < chains.size(); i++) { chains.elementAt(i).makeResidueList(visibleChainAnnotation); } } public void makeCaBondList() { for (int i = 0; i < chains.size(); i++) { chains.elementAt(i).makeCaBondList(); } } public PDBChain findChain(String id) { for (int i = 0; i < chains.size(); i++) { if (chains.elementAt(i).id.equals(id)) { return chains.elementAt(i); } } return null; } public void setChargeColours() { for (int i = 0; i < chains.size(); i++) { chains.elementAt(i).setChargeColours(); } } public void setColours(ColourSchemeI cs) { for (int i = 0; i < chains.size(); i++) { chains.elementAt(i).setChainColours(cs); } } public void setChainColours() { for (int i = 0; i < chains.size(); i++) { // divide by zero --> infinity --> 255 ;-) chains.elementAt(i).setChainColours( Color.getHSBColor(1.0f / i, .4f, 1.0f)); } } public static boolean isRNA(SequenceI seq) { for (char c : seq.getSequence()) { if ((c != 'A') && (c != 'C') && (c != 'G') && (c != 'U')) { return false; } } return true; } }