X-Git-Url: http://source.jalview.org/gitweb/?a=blobdiff_plain;f=src%2Fjalview%2Fdatamodel%2FAlignment.java;h=04977e852fcd85d83afaee169af0423b76b7468f;hb=797df64fa2a0a30773d0f48f5494d4155e5a8be3;hp=3689433aefcdcba248a8c16fdb0d005f187a436f;hpb=9efc6af45120e24f7a11cc8ce6409139844e5001;p=jalview.git diff --git a/src/jalview/datamodel/Alignment.java b/src/jalview/datamodel/Alignment.java index 3689433..04977e8 100755 --- a/src/jalview/datamodel/Alignment.java +++ b/src/jalview/datamodel/Alignment.java @@ -1,20 +1,19 @@ /* - * Jalview - A Sequence Alignment Editor and Viewer - * Copyright (C) 2007 AM Waterhouse, J Procter, G Barton, M Clamp, S Searle - * - * This program is free software; you can redistribute it and/or - * modify it under the terms of the GNU General Public License - * as published by the Free Software Foundation; either version 2 - * of the License, or (at your option) any later version. - * - * This program is distributed in the hope that it will be useful, - * but WITHOUT ANY WARRANTY; without even the implied warranty of - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - * GNU General Public License for more details. - * - * You should have received a copy of the GNU General Public License - * along with this program; if not, write to the Free Software - * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA + * Jalview - A Sequence Alignment Editor and Viewer (Version 2.7) + * Copyright (C) 2011 J Procter, AM Waterhouse, J Engelhardt, LM Lui, G Barton, M Clamp, S Searle + * + * This file is part of Jalview. + * + * Jalview is free software: you can redistribute it and/or + * modify it under the terms of the GNU General Public License + * as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. + * + * Jalview is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty + * of MERCHANTABILITY or FITNESS FOR A PARTICULAR + * PURPOSE. See the GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License along with Jalview. If not, see . */ package jalview.datamodel; @@ -22,18 +21,30 @@ import java.util.*; import jalview.analysis.*; -/** Data structure to hold and manipulate a multiple sequence alignment +/** + * Data structure to hold and manipulate a multiple sequence alignment */ -public class Alignment - implements AlignmentI +/** + * @author JimP + * + */ +public class Alignment implements AlignmentI { protected Alignment dataset; + protected Vector sequences; + protected Vector groups = new Vector(); + protected char gapCharacter = '-'; + protected int type = NUCLEOTIDE; + public static final int PROTEIN = 0; + public static final int NUCLEOTIDE = 1; + + public boolean hasRNAStructure = false; /** DOCUMENT ME!! */ public AlignmentAnnotation[] annotations; @@ -64,8 +75,9 @@ public class Alignment } - /** Make an alignment from an array of Sequences. - * + /** + * Make an alignment from an array of Sequences. + * * @param sequences */ public Alignment(SequenceI[] seqs) @@ -75,20 +87,25 @@ public class Alignment /** * Make a new alignment from an array of SeqCigars - * @param seqs SeqCigar[] + * + * @param seqs + * SeqCigar[] */ public Alignment(SeqCigar[] alseqs) { - SequenceI[] seqs = SeqCigar.createAlignmentSequences(alseqs, gapCharacter, - new ColumnSelection(), null); + SequenceI[] seqs = SeqCigar.createAlignmentSequences(alseqs, + gapCharacter, new ColumnSelection(), null); initAlignment(seqs); } /** - * Make a new alignment from an CigarArray - * JBPNote - can only do this when compactAlignment does not contain hidden regions. - * JBPNote - must also check that compactAlignment resolves to a set of SeqCigars - or construct them appropriately. - * @param compactAlignment CigarArray + * Make a new alignment from an CigarArray JBPNote - can only do this when + * compactAlignment does not contain hidden regions. JBPNote - must also check + * that compactAlignment resolves to a set of SeqCigars - or construct them + * appropriately. + * + * @param compactAlignment + * CigarArray */ public static AlignmentI createAlignment(CigarArray compactAlignment) { @@ -98,7 +115,7 @@ public class Alignment /** * DOCUMENT ME! - * + * * @return DOCUMENT ME! */ public Vector getSequences() @@ -108,7 +125,7 @@ public class Alignment public SequenceI[] getSequencesArray() { - if (sequences==null) + if (sequences == null) return null; SequenceI[] reply = new SequenceI[sequences.size()]; for (int i = 0; i < sequences.size(); i++) @@ -120,14 +137,15 @@ public class Alignment /** * DOCUMENT ME! - * - * @param i DOCUMENT ME! - * + * + * @param i + * DOCUMENT ME! + * * @return DOCUMENT ME! */ public SequenceI getSequenceAt(int i) { - if (i < sequences.size()) + if (i>-1 && i < sequences.size()) { return (SequenceI) sequences.elementAt(i); } @@ -135,8 +153,9 @@ public class Alignment return null; } - /** Adds a sequence to the alignment. Recalculates maxLength and size. - * + /** + * Adds a sequence to the alignment. Recalculates maxLength and size. + * * @param snew */ public void addSequence(SequenceI snew) @@ -156,17 +175,22 @@ public class Alignment snew = adding; } } - if (sequences==null) { - initAlignment(new SequenceI[] { snew }); - } else { + if (sequences == null) + { + initAlignment(new SequenceI[] + { snew }); + } + else + { sequences.addElement(snew); } - if (hiddenSequences!=null) + if (hiddenSequences != null) hiddenSequences.adjustHeightSequenceAdded(); } - /** Adds a sequence to the alignment. Recalculates maxLength and size. - * + /** + * Adds a sequence to the alignment. Recalculates maxLength and size. + * * @param snew */ public void setSequenceAt(int i, SequenceI snew) @@ -179,7 +203,7 @@ public class Alignment /** * DOCUMENT ME! - * + * * @return DOCUMENT ME! */ public Vector getGroups() @@ -189,7 +213,7 @@ public class Alignment public void finalize() { - if(getDataset()!=null) + if (getDataset() != null) getDataset().removeAlignmentRef(); dataset = null; @@ -200,11 +224,12 @@ public class Alignment } /** - * decrement the alignmentRefs counter by one and call finalize if it goes to zero. + * decrement the alignmentRefs counter by one and call finalize if it goes to + * zero. */ private void removeAlignmentRef() { - if (--alignmentRefs==0) + if (--alignmentRefs == 0) { finalize(); } @@ -212,8 +237,9 @@ public class Alignment /** * DOCUMENT ME! - * - * @param s DOCUMENT ME! + * + * @param s + * DOCUMENT ME! */ public void deleteSequence(SequenceI s) { @@ -222,8 +248,9 @@ public class Alignment /** * DOCUMENT ME! - * - * @param i DOCUMENT ME! + * + * @param i + * DOCUMENT ME! */ public void deleteSequence(int i) { @@ -252,9 +279,10 @@ public class Alignment /** * DOCUMENT ME! - * - * @param s DOCUMENT ME! - * + * + * @param s + * DOCUMENT ME! + * * @return DOCUMENT ME! */ public SequenceGroup[] findAllGroups(SequenceI s) @@ -317,10 +345,71 @@ public class Alignment } /** - * DOCUMENT ME! + * remove any annotation that references gp + * + * @param gp + * (if null, removes all group associated annotation) */ + private void removeAnnotationForGroup(SequenceGroup gp) + { + if (annotations == null || annotations.length == 0) + { + return; + } + // remove annotation very quickly + AlignmentAnnotation[] t, todelete = new AlignmentAnnotation[annotations.length], tokeep = new AlignmentAnnotation[annotations.length]; + int i, p, k; + if (gp == null) + { + for (i = 0, p = 0, k = 0; i < annotations.length; i++) + { + if (annotations[i].groupRef != null) + { + todelete[p++] = annotations[i]; + } + else + { + tokeep[k++] = annotations[i]; + } + } + } + else + { + for (i = 0, p = 0, k = 0; i < annotations.length; i++) + { + if (annotations[i].groupRef == gp) + { + todelete[p++] = annotations[i]; + } + else + { + tokeep[k++] = annotations[i]; + } + } + } + if (p > 0) + { + // clear out the group associated annotation. + for (i = 0; i < p; i++) + { + unhookAnnotation(todelete[i]); + todelete[i] = null; + } + t = new AlignmentAnnotation[k]; + for (i = 0; i < k; i++) + { + t[i] = tokeep[i]; + } + annotations = t; + } + } + public void deleteAllGroups() { + if (annotations != null) + { + removeAnnotationForGroup(null); + } groups.removeAllElements(); } @@ -329,6 +418,7 @@ public class Alignment { if (groups.contains(g)) { + removeAnnotationForGroup(g); groups.removeElement(g); } } @@ -336,24 +426,54 @@ public class Alignment /** */ public SequenceI findName(String name) { - return findName(name,false); + return findName(name, false); } - /* (non-Javadoc) + /* + * (non-Javadoc) + * * @see jalview.datamodel.AlignmentI#findName(java.lang.String, boolean) */ public SequenceI findName(String token, boolean b) { + return findName(null, token, b); + } + + /* + * (non-Javadoc) + * + * @see jalview.datamodel.AlignmentI#findName(SequenceI, java.lang.String, + * boolean) + */ + public SequenceI findName(SequenceI startAfter, String token, boolean b) + { int i = 0; - SequenceI sq=null; - String sqname=null; + SequenceI sq = null; + String sqname = null; + if (startAfter != null) + { + // try to find the sequence in the alignment + boolean matched = false; + while (i < sequences.size()) + { + if (getSequenceAt(i++) == startAfter) + { + matched = true; + break; + } + } + if (!matched) + { + i = 0; + } + } while (i < sequences.size()) { sq = getSequenceAt(i); sqname = sq.getName(); if (sqname.equals(token) // exact match - || (b && // allow imperfect matches - case varies + || (b && // allow imperfect matches - case varies (sqname.equalsIgnoreCase(token)))) { return getSequenceAt(i); @@ -364,6 +484,7 @@ public class Alignment return null; } + public SequenceI[] findSequenceMatch(String name) { Vector matches = new Vector(); @@ -388,7 +509,11 @@ public class Alignment } - /** */ + /* + * (non-Javadoc) + * + * @see jalview.datamodel.AlignmentI#findIndex(jalview.datamodel.SequenceI) + */ public int findIndex(SequenceI s) { int i = 0; @@ -406,9 +531,30 @@ public class Alignment return -1; } + /* + * (non-Javadoc) + * + * @see + * jalview.datamodel.AlignmentI#findIndex(jalview.datamodel.SearchResults) + */ + public int findIndex(SearchResults results) + { + int i = 0; + + while (i < sequences.size()) + { + if (results.involvesSequence(getSequenceAt(i))) + { + return i; + } + i++; + } + return -1; + } + /** * DOCUMENT ME! - * + * * @return DOCUMENT ME! */ public int getHeight() @@ -418,7 +564,7 @@ public class Alignment /** * DOCUMENT ME! - * + * * @return DOCUMENT ME! */ public int getWidth() @@ -438,8 +584,9 @@ public class Alignment /** * DOCUMENT ME! - * - * @param gc DOCUMENT ME! + * + * @param gc + * DOCUMENT ME! */ public void setGapCharacter(char gc) { @@ -448,17 +595,14 @@ public class Alignment for (int i = 0; i < sequences.size(); i++) { Sequence seq = (Sequence) sequences.elementAt(i); - seq.setSequence(seq.getSequenceAsString() - .replace('.', gc) - .replace('-', gc) - .replace(' ', gc) - ); + seq.setSequence(seq.getSequenceAsString().replace('.', gc) + .replace('-', gc).replace(' ', gc)); } } /** * DOCUMENT ME! - * + * * @return DOCUMENT ME! */ public char getGapCharacter() @@ -466,30 +610,55 @@ public class Alignment return gapCharacter; } - /** - * DOCUMENT ME! - * - * @return DOCUMENT ME! + /* + * (non-Javadoc) + * + * @see jalview.datamodel.AlignmentI#isAligned() */ public boolean isAligned() { - int width = getWidth(); + return isAligned(false); + } + /* + * (non-Javadoc) + * + * @see jalview.datamodel.AlignmentI#isAligned(boolean) + */ + public boolean isAligned(boolean includeHidden) + { + int width = getWidth(); + if (hiddenSequences == null || hiddenSequences.getSize() == 0) + { + includeHidden = true; // no hidden sequences to check against. + } for (int i = 0; i < sequences.size(); i++) { - if (getSequenceAt(i).getLength() != width) + if (includeHidden || !hiddenSequences.isHidden(getSequenceAt(i))) { - return false; + if (getSequenceAt(i).getLength() != width) + { + return false; + } } } return true; } - /* (non-Javadoc) - * @see jalview.datamodel.AlignmentI#deleteAnnotation(jalview.datamodel.AlignmentAnnotation) + + /* + * (non-Javadoc) + * + * @seejalview.datamodel.AlignmentI#deleteAnnotation(jalview.datamodel. + * AlignmentAnnotation) */ public boolean deleteAnnotation(AlignmentAnnotation aa) { + return deleteAnnotation(aa, true); + } + + public boolean deleteAnnotation(AlignmentAnnotation aa, boolean unhook) + { int aSize = 1; if (annotations != null) @@ -504,36 +673,71 @@ public class Alignment AlignmentAnnotation[] temp = new AlignmentAnnotation[aSize - 1]; - boolean swap=false; + boolean swap = false; int tIndex = 0; for (int i = 0; i < aSize; i++) { if (annotations[i] == aa) { - swap=true; + swap = true; continue; } - if (tIndex= aSize) + { + temp[aSize - 1] = aa; + } + else + { + temp[pos] = aa; + } if (aSize > 1) { - for (i = 0; i < (aSize - 1); i++) + int p = 0; + for (i = 0; i < (aSize - 1); i++, p++) { - temp[i] = annotations[i]; + if (p == pos) + { + p++; + } + if (p < temp.length) + { + temp[p] = annotations[i]; + } } } @@ -591,7 +807,7 @@ public class Alignment /** * DOCUMENT ME! - * + * * @return DOCUMENT ME! */ public AlignmentAnnotation[] getAlignmentAnnotation() @@ -622,6 +838,11 @@ public class Alignment return false; } } + + public boolean hasRNAStructure(){ + //TODO can it happen that structure is removed from alignment? + return hasRNAStructure; + } public void setDataset(Alignment data) { @@ -653,10 +874,12 @@ public class Alignment } dataset.addAlignmentRef(); } + /** * reference count for number of alignments referencing this one. */ - int alignmentRefs=0; + int alignmentRefs = 0; + /** * increase reference count to this alignment. */ @@ -674,7 +897,7 @@ public class Alignment { boolean modified = false; - //Remove excess gaps from the end of alignment + // Remove excess gaps from the end of alignment int maxLength = -1; SequenceI current; @@ -683,8 +906,8 @@ public class Alignment current = getSequenceAt(i); for (int j = current.getLength(); j > maxLength; j--) { - if (j > maxLength && !jalview.util.Comparison.isGap( - current.getCharAt(j))) + if (j > maxLength + && !jalview.util.Comparison.isGap(current.getCharAt(j))) { maxLength = j; break; @@ -695,16 +918,14 @@ public class Alignment maxLength++; int cLength; - for (int i = 0; i < sequences.size(); - i++) + for (int i = 0; i < sequences.size(); i++) { current = getSequenceAt(i); cLength = current.getLength(); if (cLength < maxLength) { - current.insertCharAt(cLength, - maxLength - cLength, gapCharacter); + current.insertCharAt(cLength, maxLength - cLength, gapCharacter); modified = true; } else if (current.getLength() > maxLength) @@ -715,6 +936,111 @@ public class Alignment return modified; } + /** + * Justify the sequences to the left or right by deleting and inserting gaps + * before the initial residue or after the terminal residue + * + * @param right + * true if alignment padded to right, false to justify to left + * @return true if alignment was changed + */ + public boolean justify(boolean right) + { + boolean modified = false; + + // Remove excess gaps from the end of alignment + int maxLength = -1; + int ends[] = new int[sequences.size() * 2]; + SequenceI current; + for (int i = 0; i < sequences.size(); i++) + { + current = getSequenceAt(i); + // This should really be a sequence method + ends[i * 2] = current.findIndex(current.getStart()); + ends[i * 2 + 1] = current.findIndex(current.getStart() + + current.getLength()); + boolean hitres = false; + for (int j = 0, rs = 0, ssiz = current.getLength(); j < ssiz; j++) + { + if (!jalview.util.Comparison.isGap(current.getCharAt(j))) + { + if (!hitres) + { + ends[i * 2] = j; + hitres = true; + } + else + { + ends[i * 2 + 1] = j; + if (j - ends[i * 2] > maxLength) + { + maxLength = j - ends[i * 2]; + } + } + } + } + } + + maxLength++; + // now edit the flanking gaps to justify to either left or right + int cLength, extent, diff; + for (int i = 0; i < sequences.size(); i++) + { + current = getSequenceAt(i); + + cLength = 1 + ends[i * 2 + 1] - ends[i * 2]; + diff = maxLength - cLength; // number of gaps to indent + extent = current.getLength(); + if (right) + { + // right justify + if (extent > ends[i * 2 + 1]) + { + current.deleteChars(ends[i * 2 + 1] + 1, extent); + modified = true; + } + if (ends[i * 2] > diff) + { + current.deleteChars(0, ends[i * 2] - diff); + modified = true; + } + else + { + if (ends[i * 2] < diff) + { + current.insertCharAt(0, diff - ends[i * 2], gapCharacter); + modified = true; + } + } + } + else + { + // left justify + if (ends[i * 2] > 0) + { + current.deleteChars(0, ends[i * 2]); + modified = true; + ends[i * 2 + 1] -= ends[i * 2]; + extent -= ends[i * 2]; + } + if (extent > maxLength) + { + current.deleteChars(maxLength + 1, extent); + modified = true; + } + else + { + if (extent < maxLength) + { + current.insertCharAt(extent, maxLength - extent, gapCharacter); + modified = true; + } + } + } + } + return modified; + } + public HiddenSequences getHiddenSequences() { return hiddenSequences; @@ -725,7 +1051,7 @@ public class Alignment SeqCigar alseqs[] = new SeqCigar[sequences.size()]; for (int i = 0; i < sequences.size(); i++) { - alseqs[i] = new SeqCigar( (SequenceI) sequences.elementAt(i)); + alseqs[i] = new SeqCigar((SequenceI) sequences.elementAt(i)); } CigarArray cal = new CigarArray(alseqs); cal.addOperation(CigarArray.M, getWidth()); @@ -734,15 +1060,15 @@ public class Alignment public void setProperty(Object key, Object value) { - if(alignmentProperties==null) + if (alignmentProperties == null) alignmentProperties = new Hashtable(); - alignmentProperties.put(key,value); + alignmentProperties.put(key, value); } public Object getProperty(Object key) { - if(alignmentProperties!=null) + if (alignmentProperties != null) return alignmentProperties.get(key); else return null; @@ -752,26 +1078,35 @@ public class Alignment { return alignmentProperties; } - AlignedCodonFrame[] codonFrameList=null; - /* (non-Javadoc) - * @see jalview.datamodel.AlignmentI#addCodonFrame(jalview.datamodel.AlignedCodonFrame) + + AlignedCodonFrame[] codonFrameList = null; + + /* + * (non-Javadoc) + * + * @see + * jalview.datamodel.AlignmentI#addCodonFrame(jalview.datamodel.AlignedCodonFrame + * ) */ public void addCodonFrame(AlignedCodonFrame codons) { - if (codons==null) + if (codons == null) return; - if (codonFrameList==null) + if (codonFrameList == null) { - codonFrameList = new AlignedCodonFrame[] { codons }; + codonFrameList = new AlignedCodonFrame[] + { codons }; return; } - AlignedCodonFrame[] t = new AlignedCodonFrame[codonFrameList.length+1]; + AlignedCodonFrame[] t = new AlignedCodonFrame[codonFrameList.length + 1]; System.arraycopy(codonFrameList, 0, t, 0, codonFrameList.length); t[codonFrameList.length] = codons; codonFrameList = t; } - /* (non-Javadoc) + /* + * (non-Javadoc) + * * @see jalview.datamodel.AlignmentI#getCodonFrame(int) */ public AlignedCodonFrame getCodonFrame(int index) @@ -779,27 +1114,32 @@ public class Alignment return codonFrameList[index]; } - /* (non-Javadoc) - * @see jalview.datamodel.AlignmentI#getCodonFrame(jalview.datamodel.SequenceI) + /* + * (non-Javadoc) + * + * @see + * jalview.datamodel.AlignmentI#getCodonFrame(jalview.datamodel.SequenceI) */ public AlignedCodonFrame[] getCodonFrame(SequenceI seq) { - if (seq==null || codonFrameList==null) + if (seq == null || codonFrameList == null) return null; - Vector cframes=new Vector(); - for (int f=0;f