/*
* Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
* Copyright (C) $$Year-Rel$$ The Jalview Authors
*
* This file is part of Jalview.
*
* Jalview is free software: you can redistribute it and/or
* modify it under the terms of the GNU General Public License
* as published by the Free Software Foundation, either version 3
* of the License, or (at your option) any later version.
*
* Jalview is distributed in the hope that it will be useful, but
* WITHOUT ANY WARRANTY; without even the implied warranty
* of MERCHANTABILITY or FITNESS FOR A PARTICULAR
* PURPOSE. See the GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Jalview. If not, see .
* The Jalview Authors are detailed in the 'AUTHORS' file.
*/
package jalview.datamodel;
import java.util.Hashtable;
import java.util.List;
import java.util.Map;
import java.util.Set;
/**
* Data structure to hold and manipulate a multiple sequence alignment
*/
public interface AlignmentI extends AnnotatedCollectionI
{
/**
* Calculates the number of sequences in an alignment, excluding hidden
* sequences
*
* @return Number of sequences in alignment
*/
int getHeight();
/**
* Calculates the number of sequences in an alignment, including hidden
* sequences
*
* @return Number of sequences in alignment
*/
int getAbsoluteHeight();
/**
*
* Answers the width of the alignment, including gaps, that is, the length of
* the longest sequence, or -1 if there are no sequences. Avoid calling this
* method repeatedly where possible, as it has to perform a calculation. Note
* that this width includes any hidden columns.
*
* @return
* @see AlignmentI#getVisibleWidth()
*/
@Override
int getWidth();
/**
*
* Answers the visible width of the alignment, including gaps, that is, the
* length of the longest sequence, excluding any hidden columns. Answers -1 if
* there are no sequences. Avoid calling this method repeatedly where
* possible, as it has to perform a calculation.
*
* @return
*/
int getVisibleWidth();
/**
* Calculates if this set of sequences (visible and invisible) are all the
* same length
*
* @return true if all sequences in alignment are the same length
*/
boolean isAligned();
/**
* Calculates if this set of sequences is all the same length
*
* @param includeHidden
* optionally exclude hidden sequences from test
* @return true if all (or just visible) sequences are the same length
*/
boolean isAligned(boolean includeHidden);
/**
* Answers if the sequence at alignmentIndex is hidden
*
* @param alignmentIndex
* the index to check
* @return true if the sequence is hidden
*/
boolean isHidden(int alignmentIndex);
/**
* Gets sequences as a Synchronized collection
*
* @return All sequences in alignment.
*/
@Override
List getSequences();
/**
* Gets sequences as a SequenceI[]
*
* @return All sequences in alignment.
*/
SequenceI[] getSequencesArray();
/**
* Find a specific sequence in this alignment.
*
* @param i
* Index of required sequence.
*
* @return SequenceI at given index.
*/
SequenceI getSequenceAt(int i);
/**
* Find a specific sequence in this alignment.
*
* @param i
* Index of required sequence in full alignment, i.e. if all columns
* were visible
*
* @return SequenceI at given index.
*/
SequenceI getSequenceAtAbsoluteIndex(int i);
/**
* Returns a map of lists of sequences keyed by sequence name.
*
* @return
*/
Map> getSequencesByName();
/**
* Add a new sequence to this alignment.
*
* @param seq
* New sequence will be added at end of alignment.
*/
void addSequence(SequenceI seq);
/**
* Used to set a particular index of the alignment with the given sequence.
*
* @param i
* Index of sequence to be updated. if i>length, sequence will be
* added to end, with no intervening positions.
* @param seq
* New sequence to be inserted. The existing sequence at position i
* will be replaced.
* @return existing sequence (or null if i>current length)
*/
SequenceI replaceSequenceAt(int i, SequenceI seq);
/**
* Deletes a sequence from the alignment. Updates hidden sequences to account
* for the removed sequence. Do NOT use this method to delete sequences which
* are just hidden.
*
* @param s
* Sequence to be deleted.
*/
void deleteSequence(SequenceI s);
/**
* Deletes a sequence from the alignment. Updates hidden sequences to account
* for the removed sequence. Do NOT use this method to delete sequences which
* are just hidden.
*
* @param i
* Index of sequence to be deleted.
*/
void deleteSequence(int i);
/**
* Deletes a sequence in the alignment which has been hidden.
*
* @param i
* Index of sequence to be deleted
*/
void deleteHiddenSequence(int i);
/**
* Finds sequence in alignment using sequence name as query.
*
* @param name
* Id of sequence to search for.
*
* @return Sequence matching query, if found. If not found returns null.
*/
SequenceI findName(String name);
SequenceI[] findSequenceMatch(String name);
/**
* Finds index of a given sequence in the alignment.
*
* @param s
* Sequence to look for.
*
* @return Index of sequence within the alignment or -1 if not found
*/
int findIndex(SequenceI s);
/**
* Returns the first group (in the order in which groups were added) that
* includes the given sequence instance and aligned position (base 0), or null
* if none found
*
* @param seq
* - must be contained in the alignment (not a dataset sequence)
* @param position
*
* @return
*/
SequenceGroup findGroup(SequenceI seq, int position);
/**
* Finds all groups that a given sequence is part of.
*
* @param s
* Sequence in alignment.
*
* @return All groups containing given sequence.
*/
SequenceGroup[] findAllGroups(SequenceI s);
/**
* Adds a new SequenceGroup to this alignment.
*
* @param sg
* New group to be added.
*/
void addGroup(SequenceGroup sg);
/**
* Deletes a specific SequenceGroup
*
* @param g
* Group will be deleted from alignment.
*/
void deleteGroup(SequenceGroup g);
/**
* Get all the groups associated with this alignment.
*
* @return All groups as a list.
*/
List getGroups();
/**
* Deletes all groups from this alignment.
*/
void deleteAllGroups();
/**
* Adds a new AlignmentAnnotation to this alignment
*
* @note Care should be taken to ensure that annotation is at least as wide as
* the longest sequence in the alignment for rendering purposes.
*/
void addAnnotation(AlignmentAnnotation aa);
/**
* moves annotation to a specified index in alignment annotation display stack
*
* @param aa
* the annotation object to be moved
* @param index
* the destination position
*/
void setAnnotationIndex(AlignmentAnnotation aa, int index);
/**
* Delete all annotations, including auto-calculated if the flag is set true.
* Returns true if at least one annotation was deleted, else false.
*
* @param includingAutoCalculated
* @return
*/
boolean deleteAllAnnotations(boolean includingAutoCalculated);
/**
* Deletes a specific AlignmentAnnotation from the alignment, and removes its
* reference from any SequenceI or SequenceGroup object's annotation if and
* only if aa is contained within the alignment's annotation vector.
* Otherwise, it will do nothing.
*
* @param aa
* the annotation to delete
* @return true if annotation was deleted from this alignment.
*/
boolean deleteAnnotation(AlignmentAnnotation aa);
/**
* Deletes a specific AlignmentAnnotation from the alignment, and optionally
* removes any reference from any SequenceI or SequenceGroup object's
* annotation if and only if aa is contained within the alignment's annotation
* vector. Otherwise, it will do nothing.
*
* @param aa
* the annotation to delete
* @param unhook
* flag indicating if any references should be removed from
* annotation - use this if you intend to add the annotation back
* into the alignment
* @return true if annotation was deleted from this alignment.
*/
boolean deleteAnnotation(AlignmentAnnotation aa, boolean unhook);
/**
* Get the annotation associated with this alignment (this can be null if no
* annotation has ever been created on the alignment)
*
* @return array of AlignmentAnnotation objects
*/
@Override
AlignmentAnnotation[] getAlignmentAnnotation();
/**
* Change the gap character used in this alignment to 'gc'
*
* @param gc
* the new gap character.
*/
void setGapCharacter(char gc);
/**
* Get the gap character used in this alignment
*
* @return gap character
*/
char getGapCharacter();
/**
* Test if alignment contains RNA structure
*
* @return true if RNA structure AligmnentAnnotation was added to alignment
*/
boolean hasRNAStructure();
/**
* Get the associated dataset for the alignment.
*
* @return Alignment containing dataset sequences or null of this is a
* dataset.
*/
AlignmentI getDataset();
/**
* Set the associated dataset for the alignment, or create one.
*
* @param dataset
* The dataset alignment or null to construct one.
*/
void setDataset(AlignmentI dataset);
/**
* pads sequences with gaps (to ensure the set looks like an alignment)
*
* @return boolean true if alignment was modified
*/
boolean padGaps();
HiddenSequences getHiddenSequences();
HiddenColumns getHiddenColumns();
/**
* Compact representation of alignment
*
* @return CigarArray
*/
CigarArray getCompactAlignment();
/**
* Set an arbitrary key value pair for an alignment. Note: both key and value
* objects should return a meaningful, human readable response to .toString()
*
* @param key
* @param value
*/
void setProperty(Object key, Object value);
/**
* Get a named property from the alignment.
*
* @param key
* @return value of property
*/
Object getProperty(Object key);
/**
* Get the property hashtable.
*
* @return hashtable of alignment properties (or null if none are defined)
*/
Hashtable getProperties();
/**
* add a reference to a frame of aligned codons for this alignment
*
* @param codons
*/
void addCodonFrame(AlignedCodonFrame codons);
/**
* remove a particular codon frame reference from this alignment
*
* @param codons
* @return true if codon frame was removed.
*/
boolean removeCodonFrame(AlignedCodonFrame codons);
/**
* get all codon frames associated with this alignment
*
* @return
*/
List getCodonFrames();
/**
* Set the codon frame mappings (replacing any existing list).
*/
void setCodonFrames(List acfs);
/**
* get codon frames involving sequenceI
*/
List getCodonFrame(SequenceI seq);
/**
* find sequence with given name in alignment
*
* @param token
* name to find
* @param b
* true implies that case insensitive matching will also be
* tried
* @return matched sequence or null
*/
SequenceI findName(String token, boolean b);
/**
* find next sequence with given name in alignment starting after a given
* sequence
*
* @param startAfter
* the sequence after which the search will be started (usually the
* result of the last call to findName)
* @param token
* name to find
* @param b
* true implies that case insensitive matching will also be
* tried
* @return matched sequence or null
*/
SequenceI findName(SequenceI startAfter, String token, boolean b);
/**
* find first sequence in alignment which is involved in the given search
* result object
*
* @param results
* @return -1 or index of sequence in alignment
*/
int findIndex(SearchResultsI results);
/**
* append sequences and annotation from another alignment object to this one.
* Note: this is a straight transfer of object references, and may result in
* toappend's dependent data being transformed to fit the alignment (changing
* gap characters, etc...). If you are uncertain, use the copy Alignment copy
* constructor to create a new version which can be appended without side
* effect.
*
* @param toappend
* - the alignment to be appended.
*/
void append(AlignmentI toappend);
/**
* Justify the sequences to the left or right by deleting and inserting gaps
* before the initial residue or after the terminal residue
*
* @param right
* true if alignment padded to right, false to justify to left
* @return true if alignment was changed TODO: return undo object
*/
boolean justify(boolean right);
/**
* add given annotation row at given position (0 is start, -1 is end)
*
* @param consensus
* @param i
*/
void addAnnotation(AlignmentAnnotation consensus, int i);
/**
* search for or create a specific annotation row on the alignment
*
* @param name
* name for annotation (must match)
* @param calcId
* calcId for the annotation (null or must match)
* @param autoCalc
* - value of autocalc flag for the annotation
* @param seqRef
* - null or specific sequence reference
* @param groupRef
* - null or specific group reference
*
* @return existing annotation matching the given attributes
*/
AlignmentAnnotation findOrCreateAnnotation(String name, String calcId,
boolean autoCalc, SequenceI seqRef, SequenceGroup groupRef);
/**
* like findOrCreateAnnotation - looks for an existing alignment annotation
* row with matching name, calcId, sequenceRef, groupRef and autoCalculated
* flag and updates it from the annotation. If none is found the annotation is
* added directly.
*
* @param ala
* @return ala or the annotation row that was updated.
*/
AlignmentAnnotation updateFromOrCopyAnnotation(AlignmentAnnotation ala);
/**
* move the given group up or down in the alignment by the given number of
* rows. Implementor assumes given group is already present on alignment - no
* recalculations are triggered.
*
* @param sg
* @param map
* @param up
* @param i
*/
void moveSelectedSequencesByOne(SequenceGroup sg,
Map map, boolean up);
/**
* validate annotation after an edit and update any alignment state flags
* accordingly
*
* @param alignmentAnnotation
*/
void validateAnnotation(AlignmentAnnotation alignmentAnnotation);
/**
* Align this alignment the same as the given one. If both of the same type
* (nucleotide/protein) then align both identically. If this is nucleotide and
* the other is protein, make 3 gaps for each gap in the protein sequences. If
* this is protein and the other is nucleotide, insert a gap for each 3 gaps
* (or part thereof) between nucleotide bases. Returns the number of mapped
* sequences that were realigned .
*
* @param al
* @return
*/
int alignAs(AlignmentI al);
/**
* Returns the set of distinct sequence names in the alignment.
*
* @return
*/
Set getSequenceNames();
/**
* Checks if the alignment has at least one sequence with one non-gaped
* residue
*
* @return
*/
public boolean hasValidSequence();
/**
* Update any mappings to 'virtual' sequences to compatible real ones, if
* present in the added sequences. Returns a count of mappings updated.
*
* @param seqs
* @return
*/
int realiseMappings(List seqs);
/**
* Returns the first AlignedCodonFrame that has a mapping between the given
* dataset sequences
*
* @param mapFrom
* @param mapTo
* @return
*/
AlignedCodonFrame getMapping(SequenceI mapFrom, SequenceI mapTo);
/**
* Set the hidden columns collection on the alignment. Answers true if the
* hidden column selection changed, else false.
*
* @param cols
* @return
*/
public boolean setHiddenColumns(HiddenColumns cols);
/**
* Insert a sequence at a position in an alignment
*
* @param i
* The index of the position.
* @param snew
* The new sequence.
*/
void insertSequenceAt(int i, SequenceI snew);
/**
* Set the first sequence as representative and hide its insertions. Typically
* used when loading JPred files.
*/
public void setupJPredAlignment();
/**
* Add gaps into the sequences aligned to profileseq under the given
* AlignmentView
*
* @param profileseq
* sequence in al which sequences are aligned to
* @param input
* alignment view where sequence corresponding to profileseq is first
* entry
* @return new HiddenColumns for new alignment view, with insertions into
* profileseq marked as hidden.
*/
public HiddenColumns propagateInsertions(SequenceI profileseq,
AlignmentView input);
}