X-Git-Url: http://source.jalview.org/gitweb/?a=blobdiff_plain;f=forester%2Fjava%2Fsrc%2Forg%2Fforester%2Fmsa%2FDeleteableMsa.java;h=5126e47634a476dd2a452809d6fcecd2a23bf74d;hb=5642da5f473ab9ae57fee86c0cb3b33525a2e916;hp=da781b87f820060a88ed2b87f289aa5e6240ddd1;hpb=ca9937e02d1d293eee015765ecb8564e563f591c;p=jalview.git diff --git a/forester/java/src/org/forester/msa/DeleteableMsa.java b/forester/java/src/org/forester/msa/DeleteableMsa.java index da781b8..5126e47 100644 --- a/forester/java/src/org/forester/msa/DeleteableMsa.java +++ b/forester/java/src/org/forester/msa/DeleteableMsa.java @@ -27,7 +27,7 @@ package org.forester.msa; import java.util.List; import org.forester.sequence.BasicSequence; -import org.forester.sequence.Sequence; +import org.forester.sequence.MolecularSequence; public final class DeleteableMsa extends BasicMsa { @@ -50,6 +50,38 @@ public final class DeleteableMsa extends BasicMsa { _seqs = msa.getNumberOfSequences(); } + public final double[] calcGappiness() { + final int length = getLength(); + final double gappiness[] = new double[ length ]; + final int seqs = getNumberOfSequences(); + for( int row = 0; row < seqs; ++row ) { + for( int col = 0; col < length; ++col ) { + } + } + return gappiness; + } + + public static int calcGapSumPerColumn( final Msa msa, final int col ) { + int gap_rows = 0; + for( int j = 0; j < msa.getNumberOfSequences(); ++j ) { + if ( msa.isGapAt( j, col ) ) { + gap_rows++; + } + } + return gap_rows; + } + + public short determineMaxIdLength() { + short max = 0; + for( int row = 0; row < getNumberOfSequences(); ++row ) { + final short l = ( short ) getIdentifier( row ).length(); + if ( l > max ) { + max = l; + } + } + return max; + } + final public void deleteGapColumns( final double max_allowed_gap_ratio ) { if ( ( max_allowed_gap_ratio < 0 ) || ( max_allowed_gap_ratio > 1 ) ) { throw new IllegalArgumentException( "max allowed gap ration is out of range: " + max_allowed_gap_ratio ); @@ -64,13 +96,13 @@ public final class DeleteableMsa extends BasicMsa { final public void deleteGapOnlyColumns() { for( int col = getLength() - 1; col >= 0; --col ) { - if ( MsaMethods.calcGapSumPerColumn( this, col ) == getNumberOfSequences() ) { + if ( isAllGap( col ) ) { deleteColumn( col ); } } } - final public void deleteRow( final String id ) { + final public MolecularSequence deleteRow( final String id, final boolean return_removed_seq ) { int row = -1; for( int r = 0; r < getNumberOfSequences(); ++r ) { if ( getIdentifier( r ).equals( id ) ) { @@ -81,7 +113,25 @@ public final class DeleteableMsa extends BasicMsa { if ( row < 0 ) { throw new IllegalArgumentException( "id [" + id + "] not found" ); } + MolecularSequence s = null; + StringBuilder sb = null; + if ( return_removed_seq ) { + s = getSequence( row ); + final char[] x = s.getMolecularSequence(); + sb = new StringBuilder( x.length ); + for( final char element : x ) { + if ( element != MolecularSequence.GAP ) { + sb.append( element ); + } + } + } deleteRow( row ); + if ( return_removed_seq ) { + return new BasicSequence( new String( s.getIdentifier() ), sb.toString(), s.getType() ); + } + else { + return null; + } } @Override @@ -108,11 +158,21 @@ public final class DeleteableMsa extends BasicMsa { } @Override - public Sequence getSequence( final int row ) { + public MolecularSequence getSequence( final int row ) { checkRow( row ); return new BasicSequence( getIdentifier( row ), getSequenceAsString( row ).toString(), getType() ); } + final public boolean isAllGap( final int col ) { + final int m_col = _mapped_col_positions[ col ]; + for( int j = 0; j < getNumberOfSequences(); ++j ) { + if ( super.getResidueAt( _mapped_row_positions[ j ], m_col ) != MolecularSequence.GAP ) { + return false; + } + } + return true; + } + @Override final public void setIdentifier( final int row, final String id ) { checkRow( row ); @@ -140,7 +200,7 @@ public final class DeleteableMsa extends BasicMsa { final private void deleteColumn( final int col ) { checkColumn( col ); - for( int c = col; c < _length - 1; ++c ) { + for( int c = col; c < ( _length - 1 ); ++c ) { _mapped_col_positions[ c ] = _mapped_col_positions[ c + 1 ]; } --_length; @@ -148,13 +208,13 @@ public final class DeleteableMsa extends BasicMsa { final private void deleteRow( final int row ) { checkRow( row ); - for( int r = row; r < _seqs - 1; ++r ) { + for( int r = row; r < ( _seqs - 1 ); ++r ) { _mapped_row_positions[ r ] = _mapped_row_positions[ r + 1 ]; } --_seqs; } - public final static DeleteableMsa createInstance( final List seqs ) { + public final static DeleteableMsa createInstance( final List seqs ) { return new DeleteableMsa( ( BasicMsa ) BasicMsa.createInstance( seqs ) ); }