X-Git-Url: http://source.jalview.org/gitweb/?a=blobdiff_plain;f=forester%2Fjava%2Fsrc%2Forg%2Fforester%2Farchaeopteryx%2FAptxUtil.java;h=89a0cdab49e0065fe99c7c56c7d4711ad2b2c8e8;hb=a3ab1c26605a4ffaaa5e8fd0927250c53c884bf9;hp=0dd82d79cdcf18002575fd02a41d372788c00878;hpb=3d6a64e0371ffedf725bf8467211ed860f298550;p=jalview.git diff --git a/forester/java/src/org/forester/archaeopteryx/AptxUtil.java b/forester/java/src/org/forester/archaeopteryx/AptxUtil.java index 0dd82d7..89a0cda 100644 --- a/forester/java/src/org/forester/archaeopteryx/AptxUtil.java +++ b/forester/java/src/org/forester/archaeopteryx/AptxUtil.java @@ -36,10 +36,12 @@ import java.io.ByteArrayOutputStream; import java.io.File; import java.io.FileNotFoundException; import java.io.IOException; +import java.io.UnsupportedEncodingException; import java.lang.reflect.InvocationTargetException; import java.lang.reflect.Method; import java.net.URI; import java.net.URL; +import java.net.URLEncoder; import java.text.ParseException; import java.util.Arrays; import java.util.HashMap; @@ -73,6 +75,7 @@ import org.forester.io.parsers.tol.TolParser; import org.forester.io.parsers.util.ParserUtils; import org.forester.phylogeny.Phylogeny; import org.forester.phylogeny.PhylogenyMethods; +import org.forester.phylogeny.PhylogenyMethods.DESCENDANT_SORT_PRIORITY; import org.forester.phylogeny.PhylogenyNode; import org.forester.phylogeny.data.Accession; import org.forester.phylogeny.data.BranchColor; @@ -83,7 +86,9 @@ import org.forester.phylogeny.iterators.PhylogenyNodeIterator; import org.forester.phylogeny.iterators.PreorderTreeIterator; import org.forester.util.AsciiHistogram; import org.forester.util.DescriptiveStatistics; +import org.forester.util.ForesterConstants; import org.forester.util.ForesterUtil; +import org.forester.util.SequenceIdParser; import org.forester.ws.seqdb.UniProtTaxonomy; public final class AptxUtil { @@ -98,6 +103,69 @@ public final class AptxUtil { Arrays.sort( AVAILABLE_FONT_FAMILIES_SORTED ); } + public final static String createUriForSeqWeb( final PhylogenyNode node, + final Configuration conf, + final TreePanel tp ) { + String uri_str = null; + final String upkb = ForesterUtil.extractUniProtKbProteinSeqIdentifier( node ); + if ( !ForesterUtil.isEmpty( upkb ) ) { + try { + uri_str = ForesterUtil.UNIPROT_KB + URLEncoder.encode( upkb, ForesterConstants.UTF8 ); + } + catch ( final UnsupportedEncodingException e ) { + showErrorMessage( tp, e.toString() ); + e.printStackTrace(); + } + } + if ( ForesterUtil.isEmpty( uri_str ) ) { + final String v = ForesterUtil.extractGenbankAccessor( node ); + if ( !ForesterUtil.isEmpty( v ) ) { + try { + if ( SequenceIdParser.isProtein( v ) ) { + uri_str = ForesterUtil.NCBI_PROTEIN + URLEncoder.encode( v, ForesterConstants.UTF8 ); + } + else { + uri_str = ForesterUtil.NCBI_NUCCORE + URLEncoder.encode( v, ForesterConstants.UTF8 ); + } + } + catch ( final UnsupportedEncodingException e ) { + showErrorMessage( tp, e.toString() ); + e.printStackTrace(); + } + } + } + if ( ForesterUtil.isEmpty( uri_str ) ) { + final String v = ForesterUtil.extractRefSeqAccessorAccessor( node ); + if ( !ForesterUtil.isEmpty( v ) ) { + try { + if ( SequenceIdParser.isProtein( v ) ) { + uri_str = ForesterUtil.NCBI_PROTEIN + URLEncoder.encode( v, ForesterConstants.UTF8 ); + } + else { + uri_str = ForesterUtil.NCBI_NUCCORE + URLEncoder.encode( v, ForesterConstants.UTF8 ); + } + } + catch ( final UnsupportedEncodingException e ) { + showErrorMessage( tp, e.toString() ); + e.printStackTrace(); + } + } + } + if ( ForesterUtil.isEmpty( uri_str ) ) { + final String v = ForesterUtil.extractGInumber( node ); + if ( !ForesterUtil.isEmpty( v ) ) { + try { + uri_str = ForesterUtil.NCBI_GI + URLEncoder.encode( v, ForesterConstants.UTF8 ); + } + catch ( final UnsupportedEncodingException e ) { + showErrorMessage( tp, e.toString() ); + e.printStackTrace(); + } + } + } + return uri_str; + } + public static MaskFormatter createMaskFormatter( final String s ) { MaskFormatter formatter = null; try { @@ -186,6 +254,36 @@ public final class AptxUtil { } } + public static Set obtainAllDistinctTaxonomies( final PhylogenyNode node ) { + final List descs = node.getAllExternalDescendants(); + final Set tax_set = new HashSet(); + for( final PhylogenyNode n : descs ) { + if ( n.getNodeData().isHasTaxonomy() && !n.getNodeData().getTaxonomy().isEmpty() ) { + tax_set.add( n.getNodeData().getTaxonomy() ); + } + } + return tax_set; + } + + /** + * Returns the set of distinct taxonomies of + * all external nodes of node. + * If at least one the external nodes has no taxonomy, + * null is returned. + * + */ + public static Set obtainDistinctTaxonomies( final PhylogenyNode node ) { + final List descs = node.getAllExternalDescendants(); + final Set tax_set = new HashSet(); + for( final PhylogenyNode n : descs ) { + if ( !n.getNodeData().isHasTaxonomy() || n.getNodeData().getTaxonomy().isEmpty() ) { + return null; + } + tax_set.add( n.getNodeData().getTaxonomy() ); + } + return tax_set; + } + public final static Accession obtainSequenceAccessionFromName( final String sequence_name ) { final String n = sequence_name.trim(); final Matcher matcher1 = seq_identifier_pattern_1.matcher( n ); @@ -494,40 +592,6 @@ public final class AptxUtil { } } - /** - * Returns the set of distinct taxonomies of - * all external nodes of node. - * If at least one the external nodes has no taxonomy, - * null is returned. - * - */ - public static Set obtainDistinctTaxonomies( final PhylogenyNode node ) { - final List descs = node.getAllExternalDescendants(); - final Set tax_set = new HashSet(); - for( final PhylogenyNode n : descs ) { - if ( !n.getNodeData().isHasTaxonomy() || n.getNodeData().getTaxonomy().isEmpty() ) { - return null; - } - tax_set.add( n.getNodeData().getTaxonomy() ); - } - return tax_set; - } - - public static Set obtainAllDistinctTaxonomies( final PhylogenyNode node ) { - final List descs = node.getAllExternalDescendants(); - final Set tax_set = new HashSet(); - for( final PhylogenyNode n : descs ) { - if ( n.getNodeData().isHasTaxonomy() && !n.getNodeData().getTaxonomy().isEmpty() ) { - tax_set.add( n.getNodeData().getTaxonomy() ); - System.out.println( n.getNodeData().getTaxonomy() ); - } - } - for( final Taxonomy taxonomy : tax_set ) { - System.out.println( taxonomy ); - } - return tax_set; - } - final static void collapseSubtree( final PhylogenyNode node, final boolean collapse ) { node.setCollapse( collapse ); if ( node.isExternal() ) { @@ -695,16 +759,19 @@ public final class AptxUtil { desc.append( "Rerootable: " ); desc.append( phy.isRerootable() ); desc.append( "\n" ); - desc.append( "Node sum: " ); + desc.append( "Nodes: " ); desc.append( phy.getNodeCount() ); desc.append( "\n" ); - desc.append( "External node sum: " ); + desc.append( "External nodes: " ); desc.append( phy.getNumberOfExternalNodes() ); desc.append( "\n" ); - desc.append( "Internal node sum: " ); + desc.append( "Internal nodes: " ); desc.append( phy.getNodeCount() - phy.getNumberOfExternalNodes() ); desc.append( "\n" ); - desc.append( "Branche sum: " ); + desc.append( "Internal nodes with polytomies: " ); + desc.append( PhylogenyMethods.countNumberOfPolytomies( phy ) ); + desc.append( "\n" ); + desc.append( "Branches: " ); desc.append( phy.getNumberOfBranches() ); desc.append( "\n" ); desc.append( "Depth: " ); @@ -854,17 +921,6 @@ public final class AptxUtil { return true; } - final static boolean isJava15() { - try { - final String s = ForesterUtil.JAVA_VERSION; - return s.startsWith( "1.5" ); - } - catch ( final Exception e ) { - ForesterUtil.printWarningMessage( Constants.PRG_NAME, "minor error: " + e ); - return false; - } - } - final static boolean isMac() { try { final String s = ForesterUtil.OS_NAME.toLowerCase(); @@ -950,6 +1006,20 @@ public final class AptxUtil { } } + final static void outOfMemoryError( final OutOfMemoryError e ) { + System.err.println(); + System.err.println( "Java memory allocation might be too small, try \"-Xmx2048m\" java command line option" ); + System.err.println(); + e.printStackTrace(); + System.err.println(); + JOptionPane.showMessageDialog( null, + "Java memory allocation might be too small, try \"-Xmx2048m\" java command line option" + + "\n\nError: " + e.getLocalizedMessage(), + "Out of Memory Error [" + Constants.PRG_NAME + " " + Constants.VERSION + "]", + JOptionPane.ERROR_MESSAGE ); + System.exit( -1 ); + } + final static void printAppletMessage( final String applet_name, final String message ) { System.out.println( "[" + applet_name + "] > " + message ); } @@ -958,8 +1028,9 @@ public final class AptxUtil { final boolean phyloxml_validate_against_xsd, final boolean replace_underscores, final boolean internal_numbers_are_confidences, - final TAXONOMY_EXTRACTION taxonomy_extraction ) - throws FileNotFoundException, IOException { + final TAXONOMY_EXTRACTION taxonomy_extraction, + final boolean midpoint_reroot ) throws FileNotFoundException, + IOException { final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance(); final PhylogenyParser parser; boolean nhx_or_nexus = false; @@ -988,6 +1059,12 @@ public final class AptxUtil { PhylogenyMethods.transferInternalNodeNamesToConfidence( phy ); } } + if ( midpoint_reroot ) { + for( final Phylogeny phy : phys ) { + PhylogenyMethods.midpointRoot( phy ); + PhylogenyMethods.orderAppearance( phy.getRoot(), true, true, DESCENDANT_SORT_PRIORITY.NODE_NAME ); + } + } return phys; } @@ -1015,20 +1092,6 @@ public final class AptxUtil { System.exit( -1 ); } - final static void outOfMemoryError( final OutOfMemoryError e ) { - System.err.println(); - System.err.println( "Java memory allocation might be too small, try \"-Xmx2048m\" java command line option" ); - System.err.println(); - e.printStackTrace(); - System.err.println(); - JOptionPane.showMessageDialog( null, - "Java memory allocation might be too small, try \"-Xmx2048m\" java command line option" - + "\n\nError: " + e.getLocalizedMessage(), - "Out of Memory Error [" + Constants.PRG_NAME + " " + Constants.VERSION + "]", - JOptionPane.ERROR_MESSAGE ); - System.exit( -1 ); - } - final static void unexpectedException( final Exception e ) { System.err.println(); e.printStackTrace( System.err );