// / $Id: // FORESTER -- software libraries and applications // for evolutionary biology research and applications. // // Copyright (C) 2014 Christian M. Zmasek // Copyright (C) 2014 Sanford-Burnham Medical Research Institute // All rights reserved // // This library is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; either // version 2.1 of the License, or (at your option) any later version. // // This library is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU // Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public // License along with this library; if not, write to the Free Software // Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA // // WWW: https://sites.google.com/site/cmzmasek/home/software/forester package org.forester.msa; import java.util.List; import org.forester.sequence.BasicSequence; import org.forester.sequence.Sequence; public final class DeleteableMsa extends BasicMsa { private int _length = 0; private int _mapped_col_positions[] = null; private int _mapped_row_positions[] = null; private int _seqs = 0; private DeleteableMsa( final BasicMsa msa ) { super( msa ); _mapped_col_positions = new int[ msa.getLength() ]; _mapped_row_positions = new int[ msa.getNumberOfSequences() ]; for( int i = 0; i < _mapped_col_positions.length; ++i ) { _mapped_col_positions[ i ] = i; } for( int i = 0; i < _mapped_row_positions.length; ++i ) { _mapped_row_positions[ i ] = i; } _length = msa.getLength(); _seqs = msa.getNumberOfSequences(); } final public void deleteGapColumns( final double max_allowed_gap_ratio ) { if ( ( max_allowed_gap_ratio < 0 ) || ( max_allowed_gap_ratio > 1 ) ) { throw new IllegalArgumentException( "max allowed gap ration is out of range: " + max_allowed_gap_ratio ); } for( int col = getLength() - 1; col >= 0; --col ) { final boolean delete = ( ( double ) MsaMethods.calcGapSumPerColumn( this, col ) / getNumberOfSequences() ) > max_allowed_gap_ratio; if ( delete ) { deleteColumn( col ); } } } final public void deleteGapOnlyColumns() { for( int col = getLength() - 1; col >= 0; --col ) { if ( MsaMethods.calcGapSumPerColumn( this, col ) == getNumberOfSequences() ) { deleteColumn( col ); } } } final public void deleteRow( final String id ) { int row = -1; for( int r = 0; r < getNumberOfSequences(); ++r ) { if ( getIdentifier( r ).equals( id ) ) { row = r; break; } } if ( row < 0 ) { throw new IllegalArgumentException( "id [" + id + "] not found" ); } deleteRow( row ); } @Override final public String getIdentifier( final int row ) { checkRow( row ); return super.getIdentifier( _mapped_row_positions[ row ] ); } @Override final public int getLength() { return _length; } @Override final public int getNumberOfSequences() { return _seqs; } @Override final public char getResidueAt( final int row, final int col ) { checkRow( row ); checkColumn( col ); return super.getResidueAt( _mapped_row_positions[ row ], _mapped_col_positions[ col ] ); } @Override public Sequence getSequence( final int row ) { checkRow( row ); return new BasicSequence( getIdentifier( row ), getSequenceAsString( row ).toString(), getType() ); } @Override final public void setIdentifier( final int row, final String id ) { checkRow( row ); super.setIdentifier( _mapped_row_positions[ row ], id ); } @Override final public void setResidueAt( final int row, final int col, final char residue ) { checkRow( row ); checkColumn( col ); super.setResidueAt( _mapped_row_positions[ row ], _mapped_col_positions[ col ], residue ); } final private void checkColumn( final int col ) { if ( ( col >= _length ) || ( col < 0 ) ) { throw new IllegalArgumentException( "column " + col + " is out of range" ); } } final private void checkRow( final int row ) { if ( ( row >= _seqs ) || ( row < 0 ) ) { throw new IllegalArgumentException( "row " + row + " is out of range" ); } } final private void deleteColumn( final int col ) { checkColumn( col ); for( int c = col; c < _length - 1; ++c ) { _mapped_col_positions[ c ] = _mapped_col_positions[ c + 1 ]; } --_length; } final private void deleteRow( final int row ) { checkRow( row ); for( int r = row; r < _seqs - 1; ++r ) { _mapped_row_positions[ r ] = _mapped_row_positions[ r + 1 ]; } --_seqs; } public final static DeleteableMsa createInstance( final List seqs ) { return new DeleteableMsa( ( BasicMsa ) BasicMsa.createInstance( seqs ) ); } public final static DeleteableMsa createInstance( final Msa msa ) { return new DeleteableMsa( ( BasicMsa ) msa ); } }