X-Git-Url: http://source.jalview.org/gitweb/?a=blobdiff_plain;f=forester%2Fjava%2Fsrc%2Forg%2Fforester%2Ftest%2FTest.java;h=22253df3afaa76cae7255bef54be95b88cff6e4f;hb=e6ea1a1dcb0a9b96cad1bc08c3b80a6f876344d2;hp=4023539191e9fcc887943626d45ff469245db609;hpb=de830ea1bec9c9e224a53c92c9e5a886ee9642f5;p=jalview.git diff --git a/forester/java/src/org/forester/test/Test.java b/forester/java/src/org/forester/test/Test.java index 4023539..22253df 100644 --- a/forester/java/src/org/forester/test/Test.java +++ b/forester/java/src/org/forester/test/Test.java @@ -2,8 +2,8 @@ // FORESTER -- software libraries and applications // for evolutionary biology research and applications. // -// Copyright (C) 2008-2009 Christian M. Zmasek -// Copyright (C) 2008-2009 Burnham Institute for Medical Research +// Copyright (C) 2014 Christian M. Zmasek +// Copyright (C) 2014 Sanford-Burnham Medical Research Institute // All rights reserved // // This library is free software; you can redistribute it and/or @@ -20,7 +20,6 @@ // License along with this library; if not, write to the Free Software // Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA // -// Contact: phylosoft @ gmail . com // WWW: https://sites.google.com/site/cmzmasek/home/software/forester package org.forester.test; @@ -29,6 +28,8 @@ import java.io.ByteArrayInputStream; import java.io.File; import java.io.FileInputStream; import java.io.IOException; +import java.io.StringWriter; +import java.io.Writer; import java.net.URL; import java.util.ArrayList; import java.util.Date; @@ -40,7 +41,9 @@ import java.util.Set; import java.util.SortedSet; import org.forester.application.support_transfer; +import org.forester.archaeopteryx.AptxUtil; import org.forester.archaeopteryx.TreePanelUtil; +import org.forester.archaeopteryx.webservices.WebserviceUtil; import org.forester.development.DevelopmentTools; import org.forester.evoinference.TestPhylogenyReconstruction; import org.forester.evoinference.matrix.character.CharacterStateMatrix; @@ -61,8 +64,10 @@ import org.forester.io.parsers.util.ParserUtils; import org.forester.io.writers.PhylogenyWriter; import org.forester.io.writers.SequenceWriter; import org.forester.msa.BasicMsa; +import org.forester.msa.DeleteableMsa; import org.forester.msa.Mafft; import org.forester.msa.Msa; +import org.forester.msa.Msa.MSA_FORMAT; import org.forester.msa.MsaInferrer; import org.forester.msa.MsaMethods; import org.forester.pccx.TestPccx; @@ -135,6 +140,7 @@ public final class Test { + ForesterUtil.getFileSeparator() + "test_data" + ForesterUtil.getFileSeparator(); private final static boolean PERFORM_DB_TESTS = false; + private static final boolean PERFORM_WEB_TREE_ACCESS = true; private static final String PHYLOXML_LOCAL_XSD = PATH_TO_RESOURCES + "phyloxml_schema/" + ForesterConstants.PHYLO_XML_VERSION + "/" + ForesterConstants.PHYLO_XML_XSD; @@ -175,6 +181,15 @@ public final class Test { System.exit( -1 ); } final long start_time = new Date().getTime(); + System.out.print( "MSA entropy: " ); + if ( Test.testMsaEntropy() ) { + System.out.println( "OK." ); + succeeded++; + } + else { + System.out.println( "failed." ); + failed++; + } System.out.print( "Basic node methods: " ); if ( Test.testBasicNodeMethods() ) { System.out.println( "OK." ); @@ -256,31 +271,6 @@ public final class Test { System.out.println( "failed." ); failed++; } - if ( PERFORM_DB_TESTS ) { - System.out.print( "Ebi Entry Retrieval: " ); - if ( Test.testEbiEntryRetrieval() ) { - System.out.println( "OK." ); - succeeded++; - } - else { - System.out.println( "failed." ); - failed++; - } - } - // System.exit( 0 ); - if ( PERFORM_DB_TESTS ) { - System.out.print( "Sequence DB tools 2: " ); - if ( testSequenceDbWsTools2() ) { - System.out.println( "OK." ); - succeeded++; - } - else { - System.out.println( "failed." ); - failed++; - System.exit( -1 ); - } - } - // System.exit( 0 ); System.out.print( "Hmmscan output parser: " ); if ( testHmmscanOutputParser() ) { System.out.println( "OK." ); @@ -290,7 +280,6 @@ public final class Test { System.out.println( "failed." ); failed++; } - // System.out.print( "Overlap removal: " ); if ( !org.forester.test.Test.testOverlapRemoval() ) { System.out.println( "failed." ); @@ -309,7 +298,6 @@ public final class Test { succeeded++; } System.out.println( "OK." ); - // System.out.print( "Taxonomy code extraction: " ); if ( Test.testExtractTaxonomyCodeFromNodeName() ) { System.out.println( "OK." ); @@ -880,29 +868,6 @@ public final class Test { System.out.println( "failed." ); failed++; } - if ( PERFORM_DB_TESTS ) { - System.out.print( "Uniprot Entry Retrieval: " ); - if ( Test.testUniprotEntryRetrieval() ) { - System.out.println( "OK." ); - succeeded++; - } - else { - System.out.println( "failed." ); - failed++; - } - } - if ( PERFORM_DB_TESTS ) { - System.out.print( "Uniprot Taxonomy Search: " ); - if ( Test.testUniprotTaxonomySearch() ) { - System.out.println( "OK." ); - succeeded++; - } - else { - System.out.println( "failed." ); - failed++; - } - } - //---- String path = ""; final String os = ForesterUtil.OS_NAME.toLowerCase(); if ( ( os.indexOf( "mac" ) >= 0 ) && ( os.indexOf( "os" ) > 0 ) ) { @@ -930,7 +895,6 @@ public final class Test { System.out.println( "failed [will not count towards failed tests]" ); } } - //---- System.out.print( "Next nodes with collapsed: " ); if ( Test.testNextNodeWithCollapsing() ) { System.out.println( "OK." ); @@ -949,8 +913,8 @@ public final class Test { System.out.println( "failed." ); failed++; } - System.out.print( "NHX parsing from URL: " ); - if ( Test.testNHXparsingFromURL() ) { + System.out.print( "Deleteable MSA: " ); + if ( Test.testDeleteableMsa() ) { System.out.println( "OK." ); succeeded++; } @@ -958,14 +922,113 @@ public final class Test { System.out.println( "failed." ); failed++; } - System.out.print( "phyloXML parsing from URL: " ); - if ( Test.testPhyloXMLparsingFromURL() ) { - System.out.println( "OK." ); - succeeded++; + if ( PERFORM_DB_TESTS ) { + System.out.print( "Uniprot Entry Retrieval: " ); + if ( Test.testUniprotEntryRetrieval() ) { + System.out.println( "OK." ); + succeeded++; + } + else { + System.out.println( "failed." ); + failed++; + } + System.out.print( "Ebi Entry Retrieval: " ); + if ( Test.testEbiEntryRetrieval() ) { + System.out.println( "OK." ); + succeeded++; + } + else { + System.out.println( "failed." ); + failed++; + } + System.out.print( "Sequence DB tools 2: " ); + if ( testSequenceDbWsTools2() ) { + System.out.println( "OK." ); + succeeded++; + } + else { + System.out.println( "failed." ); + failed++; + System.exit( -1 ); + } + System.out.print( "Uniprot Taxonomy Search: " ); + if ( Test.testUniprotTaxonomySearch() ) { + System.out.println( "OK." ); + succeeded++; + } + else { + System.out.println( "failed." ); + failed++; + } } - else { - System.out.println( "failed." ); - failed++; + if ( PERFORM_WEB_TREE_ACCESS ) { + System.out.print( "NHX parsing from URL: " ); + if ( Test.testNHXparsingFromURL() ) { + System.out.println( "OK." ); + succeeded++; + } + else { + System.out.println( "failed." ); + failed++; + } + System.out.print( "NHX parsing from URL 2: " ); + if ( Test.testNHXparsingFromURL2() ) { + System.out.println( "OK." ); + succeeded++; + } + else { + System.out.println( "failed." ); + failed++; + } + System.out.print( "phyloXML parsing from URL: " ); + if ( Test.testPhyloXMLparsingFromURL() ) { + System.out.println( "OK." ); + succeeded++; + } + else { + System.out.println( "failed." ); + failed++; + } + System.out.print( "TreeBase acccess: " ); + if ( Test.testTreeBaseReading() ) { + System.out.println( "OK." ); + succeeded++; + } + else { + System.out.println( "failed." ); + failed++; + } + // + System.out.print( "ToL access: " ); + if ( Test.testToLReading() ) { + System.out.println( "OK." ); + succeeded++; + } + else { + System.out.println( "failed." ); + failed++; + } + // + System.out.print( "TreeFam access: " ); + if ( Test.testTreeFamReading() ) { + System.out.println( "OK." ); + succeeded++; + } + else { + System.out.println( "failed." ); + failed++; + } + // + // + System.out.print( "Pfam tree access: " ); + if ( Test.testPfamTreeReading() ) { + System.out.println( "OK." ); + succeeded++; + } + else { + System.out.println( "failed." ); + failed++; + } } System.out.println(); final Runtime rt = java.lang.Runtime.getRuntime(); @@ -1084,13 +1147,63 @@ public final class Test { return true; } - public static final boolean testPhyloXMLparsingFromURL() { + public static final boolean testNHXparsingFromURL2() { try { - final String s = "https://sites.google.com/site/cmzmasek/home/software/archaeopteryx/examples/archaeopteryx_a/apaf_bcl2.xml"; - final URL u = new URL( s ); - final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance(); - final Phylogeny[] phys = factory.create( u.openStream(), PhyloXmlParser.createPhyloXmlParser() ); - if ( ( phys == null ) || ( phys.length != 2 ) ) { + final String s = "https://sites.google.com/site/cmzmasek/home/software/archaeopteryx/examples/simple/simple_1.nh"; + final Phylogeny phys[] = AptxUtil.readPhylogeniesFromUrl( new URL( s ), + false, + false, + false, + TAXONOMY_EXTRACTION.NO, + false ); + if ( ( phys == null ) || ( phys.length != 5 ) ) { + return false; + } + if ( !phys[ 0 ].toNewHampshire().equals( "((((A,B),C),D),(E,F));" ) ) { + System.out.println( phys[ 0 ].toNewHampshire() ); + return false; + } + if ( !phys[ 1 ].toNewHampshire().equals( "((1,2,3),(4,5,6),(7,8,9));" ) ) { + System.out.println( phys[ 1 ].toNewHampshire() ); + return false; + } + final Phylogeny phys2[] = AptxUtil.readPhylogeniesFromUrl( new URL( s ), + false, + false, + false, + TAXONOMY_EXTRACTION.NO, + false ); + if ( ( phys2 == null ) || ( phys2.length != 5 ) ) { + return false; + } + if ( !phys2[ 0 ].toNewHampshire().equals( "((((A,B),C),D),(E,F));" ) ) { + System.out.println( phys2[ 0 ].toNewHampshire() ); + return false; + } + if ( !phys2[ 1 ].toNewHampshire().equals( "((1,2,3),(4,5,6),(7,8,9));" ) ) { + System.out.println( phys2[ 1 ].toNewHampshire() ); + return false; + } + final Phylogeny phys3[] = AptxUtil.readPhylogeniesFromUrl( new URL( "http://swisstree.vital-it.ch:80/" + + "SwissTree/ST001/consensus_tree.nhx" ), false, false, false, TAXONOMY_EXTRACTION.NO, false ); + if ( ( phys3 == null ) || ( phys3.length != 1 ) ) { + return false; + } + if ( !phys3[ 0 ] + .toNewHampshire() + .equals( "((((POP23a_CIOIN_ENSCING00000016202,POP23b_CIOIN_ENSCING00000016169),POP23_CIOSA_ENSCSAVG00000000248),((POP23a_BRAFL_C3ZMF1,POP23b_BRAFL_121417),(((POP3_ORYLA_ENSORLG00000019669,POP3_GASAC_ENSGACG00000014023,POP3_DANRE_Q6JWW1),(POP3_XENTR_B1H1F6,(POP3_CHICK_Q9DG25,(POP3_ORNAN_ENSOANG00000004179,POP3_MONDO_ENSMODG00000018033,((POP3_MOUSE_Q9ES81,POP3_RAT_Q3BCU3),POP3_RABIT_ENSOCUG00000025973,POP3_MACMU_ENSMMUG00000014473,POP3_HUMAN_Q9HBV1))))),(((POP2_GASAC_ENSGACG00000001420,POP2_ORYLA_ENSORLG00000008627,POP2_TAKRU_ENSTRUG00000015933),POP2_DANRE_ENSDARG00000069922),POP2_XENTR_ENSXETG00000018064,(((POP2_TAEGU_ENSTGUG00000013383,POP2_CHICK_Q6T9Z5),POP2_ANOCA_ENSACAG00000003557),((POP2_MACEU_ENSMEUG00000015825,POP2_MONDO_ENSMODG00000018205),((POP2_RABIT_ENSOCUG00000009515,(POP2_RAT_Q6P722,POP2_MOUSE_Q9ES82)),(POP2_MACMU_ENSMMUG00000000905,POP2_HUMAN_Q9HBU9)))))))),((POP1_CIOSA_ENSCSAVG00000000247,POP1_CIOIN_ENSCING00000000496),((POP1_DANRE_Q5PQZ7,(POP1_ORYLA_ENSORLG00000019663,POP1_GASAC_ENSGACG00000014015,POP1_TAKRU_ENSORLG00000019663)),(POP1_XENTR_B1H1G2,(POP1_ANOCA_ENSACAG00000003910,(POP1_TAEGU_ENSTGUG00000012218,POP1_CHICK_Q9DG23)),POP1_ORNAN_ENSOANG00000004180,POP1_MONDO_ENSMODG00000018034,(POP1_RABIT_ENSOCUG00000016944,(POP1_RAT_Q3BCU4,POP1_MOUSE_Q9ES83),(POP1_HUMAN_Q8NE79,POP1_MACMU_ENSMMUG00000014471))))));" ) ) { + System.out.println( phys3[ 0 ].toNewHampshire() ); + return false; + } + final Phylogeny phys4[] = AptxUtil.readPhylogeniesFromUrl( new URL( "http://swisstree.vital-it.ch:80/" + + "SwissTree/ST001/consensus_tree.nhx" ), false, false, false, TAXONOMY_EXTRACTION.NO, false ); + if ( ( phys4 == null ) || ( phys4.length != 1 ) ) { + return false; + } + if ( !phys4[ 0 ] + .toNewHampshire() + .equals( "((((POP23a_CIOIN_ENSCING00000016202,POP23b_CIOIN_ENSCING00000016169),POP23_CIOSA_ENSCSAVG00000000248),((POP23a_BRAFL_C3ZMF1,POP23b_BRAFL_121417),(((POP3_ORYLA_ENSORLG00000019669,POP3_GASAC_ENSGACG00000014023,POP3_DANRE_Q6JWW1),(POP3_XENTR_B1H1F6,(POP3_CHICK_Q9DG25,(POP3_ORNAN_ENSOANG00000004179,POP3_MONDO_ENSMODG00000018033,((POP3_MOUSE_Q9ES81,POP3_RAT_Q3BCU3),POP3_RABIT_ENSOCUG00000025973,POP3_MACMU_ENSMMUG00000014473,POP3_HUMAN_Q9HBV1))))),(((POP2_GASAC_ENSGACG00000001420,POP2_ORYLA_ENSORLG00000008627,POP2_TAKRU_ENSTRUG00000015933),POP2_DANRE_ENSDARG00000069922),POP2_XENTR_ENSXETG00000018064,(((POP2_TAEGU_ENSTGUG00000013383,POP2_CHICK_Q6T9Z5),POP2_ANOCA_ENSACAG00000003557),((POP2_MACEU_ENSMEUG00000015825,POP2_MONDO_ENSMODG00000018205),((POP2_RABIT_ENSOCUG00000009515,(POP2_RAT_Q6P722,POP2_MOUSE_Q9ES82)),(POP2_MACMU_ENSMMUG00000000905,POP2_HUMAN_Q9HBU9)))))))),((POP1_CIOSA_ENSCSAVG00000000247,POP1_CIOIN_ENSCING00000000496),((POP1_DANRE_Q5PQZ7,(POP1_ORYLA_ENSORLG00000019663,POP1_GASAC_ENSGACG00000014015,POP1_TAKRU_ENSORLG00000019663)),(POP1_XENTR_B1H1G2,(POP1_ANOCA_ENSACAG00000003910,(POP1_TAEGU_ENSTGUG00000012218,POP1_CHICK_Q9DG23)),POP1_ORNAN_ENSOANG00000004180,POP1_MONDO_ENSMODG00000018034,(POP1_RABIT_ENSOCUG00000016944,(POP1_RAT_Q3BCU4,POP1_MOUSE_Q9ES83),(POP1_HUMAN_Q8NE79,POP1_MACMU_ENSMMUG00000014471))))));" ) ) { + System.out.println( phys4[ 0 ].toNewHampshire() ); return false; } } @@ -1319,6 +1432,115 @@ public final class Test { return true; } + public static final boolean testPfamTreeReading() { + try { + final URL u = new URL( WebserviceUtil.PFAM_SERVER + "/family/PF" + "01849" + "/tree/download" ); + final NHXParser parser = new NHXParser(); + parser.setTaxonomyExtraction( NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_STRICT ); + parser.setReplaceUnderscores( false ); + parser.setGuessRootedness( true ); + final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance(); + final Phylogeny[] phys = factory.create( u.openStream(), parser ); + if ( ( phys == null ) || ( phys.length != 1 ) ) { + return false; + } + if ( phys[ 0 ].getNumberOfExternalNodes() < 10 ) { + return false; + } + } + catch ( final Exception e ) { + e.printStackTrace(); + } + return true; + } + + public static final boolean testPhyloXMLparsingFromURL() { + try { + final String s = "https://sites.google.com/site/cmzmasek/home/software/archaeopteryx/examples/archaeopteryx_a/apaf_bcl2.xml"; + final URL u = new URL( s ); + final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance(); + final Phylogeny[] phys = factory.create( u.openStream(), PhyloXmlParser.createPhyloXmlParser() ); + if ( ( phys == null ) || ( phys.length != 2 ) ) { + return false; + } + } + catch ( final Exception e ) { + e.printStackTrace(); + } + return true; + } + + public static final boolean testToLReading() { + try { + final URL u = new URL( WebserviceUtil.TOL_URL_BASE + "15079" ); + final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance(); + final Phylogeny[] phys = factory.create( u.openStream(), new TolParser() ); + if ( ( phys == null ) || ( phys.length != 1 ) ) { + return false; + } + if ( !phys[ 0 ].getRoot().getNodeData().getTaxonomy().getIdentifier().getValue().equals( "15079" ) ) { + return false; + } + if ( !phys[ 0 ].getRoot().getNodeData().getTaxonomy().getScientificName().equals( "Protacanthopterygii" ) ) { + return false; + } + if ( phys[ 0 ].getNumberOfExternalNodes() < 5 ) { + return false; + } + } + catch ( final Exception e ) { + e.printStackTrace(); + } + return true; + } + + public static final boolean testTreeBaseReading() { + try { + final URL u = new URL( WebserviceUtil.TREEBASE_PHYLOWS_TREE_URL_BASE + "825?format=nexus" ); + final NexusPhylogeniesParser parser = new NexusPhylogeniesParser(); + parser.setReplaceUnderscores( true ); + final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance(); + final Phylogeny[] phys = factory.create( u.openStream(), parser ); + if ( ( phys == null ) || ( phys.length != 1 ) ) { + return false; + } + final URL u2 = new URL( WebserviceUtil.TREEBASE_PHYLOWS_STUDY_URL_BASE + "15613?format=nexus" ); + final NexusPhylogeniesParser parser2 = new NexusPhylogeniesParser(); + parser2.setReplaceUnderscores( true ); + final PhylogenyFactory factory2 = ParserBasedPhylogenyFactory.getInstance(); + final Phylogeny[] phys2 = factory2.create( u2.openStream(), parser2 ); + if ( ( phys2 == null ) || ( phys2.length != 9 ) ) { + return false; + } + } + catch ( final Exception e ) { + e.printStackTrace(); + } + return true; + } + + public static final boolean testTreeFamReading() { + try { + final URL u = new URL( WebserviceUtil.TREE_FAM_URL_BASE + "101004" + "/tree/newick" ); + final NHXParser parser = new NHXParser(); + parser.setTaxonomyExtraction( NHXParser.TAXONOMY_EXTRACTION.NO ); + parser.setReplaceUnderscores( false ); + parser.setGuessRootedness( true ); + final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance(); + final Phylogeny[] phys = factory.create( u.openStream(), parser ); + if ( ( phys == null ) || ( phys.length != 1 ) ) { + return false; + } + if ( phys[ 0 ].getNumberOfExternalNodes() < 10 ) { + return false; + } + } + catch ( final Exception e ) { + e.printStackTrace(); + } + return true; + } + private final static Phylogeny createPhylogeny( final String nhx ) throws IOException { final Phylogeny p = ParserBasedPhylogenyFactory.getInstance().create( nhx, new NHXParser() )[ 0 ]; return p; @@ -3342,7 +3564,7 @@ public final class Test { if ( t4.getNumberOfExternalNodes() != 5 ) { return false; } - String s = w.toNewHampshire( t4, false, true ).toString(); + String s = w.toNewHampshire( t4, true ).toString(); if ( !s.equals( "((A,(B11,B12)),(C,D));" ) ) { return false; } @@ -3363,7 +3585,7 @@ public final class Test { if ( !n.getName().equals( "D" ) ) { return false; } - s = w.toNewHampshire( t4, false, true ).toString(); + s = w.toNewHampshire( t4, true ).toString(); if ( !s.equals( "((A,B12),D);" ) ) { return false; } @@ -3372,7 +3594,7 @@ public final class Test { if ( t5.getNumberOfExternalNodes() != 5 ) { return false; } - s = w.toNewHampshire( t5, false, true ).toString(); + s = w.toNewHampshire( t5, true ).toString(); if ( !s.equals( "(((B11,B12),B2),(C,D));" ) ) { return false; } @@ -3381,7 +3603,7 @@ public final class Test { if ( t6.getNumberOfExternalNodes() != 5 ) { return false; } - s = w.toNewHampshire( t6, false, false ).toString(); + s = w.toNewHampshire( t6, false ).toString(); if ( !s.equals( "((A,(B12,B2)),(C,D));" ) ) { return false; } @@ -3390,7 +3612,7 @@ public final class Test { if ( t7.getNumberOfExternalNodes() != 5 ) { return false; } - s = w.toNewHampshire( t7, false, true ).toString(); + s = w.toNewHampshire( t7, true ).toString(); if ( !s.equals( "((A,(B11,B2)),(C,D));" ) ) { return false; } @@ -3399,7 +3621,7 @@ public final class Test { if ( t8.getNumberOfExternalNodes() != 5 ) { return false; } - s = w.toNewHampshire( t8, false, false ).toString(); + s = w.toNewHampshire( t8, false ).toString(); if ( !s.equals( "((A,(B11,B12)),(C,D));" ) ) { return false; } @@ -3408,7 +3630,7 @@ public final class Test { if ( t9.getNumberOfExternalNodes() != 5 ) { return false; } - s = w.toNewHampshire( t9, false, true ).toString(); + s = w.toNewHampshire( t9, true ).toString(); if ( !s.equals( "((A,((B11,B12),B2)),D);" ) ) { return false; } @@ -3417,7 +3639,7 @@ public final class Test { if ( t10.getNumberOfExternalNodes() != 5 ) { return false; } - s = w.toNewHampshire( t10, false, true ).toString(); + s = w.toNewHampshire( t10, true ).toString(); if ( !s.equals( "((A,((B11,B12),B2)),C);" ) ) { return false; } @@ -3426,7 +3648,7 @@ public final class Test { if ( t11.getNumberOfExternalNodes() != 2 ) { return false; } - s = w.toNewHampshire( t11, false, true ).toString(); + s = w.toNewHampshire( t11, true ).toString(); if ( !s.equals( "(B,C);" ) ) { return false; } @@ -3434,7 +3656,7 @@ public final class Test { if ( t11.getNumberOfExternalNodes() != 1 ) { return false; } - s = w.toNewHampshire( t11, false, false ).toString(); + s = w.toNewHampshire( t11, false ).toString(); if ( !s.equals( "B;" ) ) { return false; } @@ -3443,7 +3665,7 @@ public final class Test { if ( t12.getNumberOfExternalNodes() != 8 ) { return false; } - s = w.toNewHampshire( t12, false, true ).toString(); + s = w.toNewHampshire( t12, true ).toString(); if ( !s.equals( "((A1,A2,A3),(B1,B3),(C1,C2,C3));" ) ) { return false; } @@ -3451,7 +3673,7 @@ public final class Test { if ( t12.getNumberOfExternalNodes() != 7 ) { return false; } - s = w.toNewHampshire( t12, false, true ).toString(); + s = w.toNewHampshire( t12, true ).toString(); if ( !s.equals( "((A1,A2,A3),B1,(C1,C2,C3));" ) ) { return false; } @@ -3459,7 +3681,7 @@ public final class Test { if ( t12.getNumberOfExternalNodes() != 6 ) { return false; } - s = w.toNewHampshire( t12, false, true ).toString(); + s = w.toNewHampshire( t12, true ).toString(); if ( !s.equals( "((A1,A2,A3),B1,(C1,C2));" ) ) { return false; } @@ -3467,7 +3689,7 @@ public final class Test { if ( t12.getNumberOfExternalNodes() != 5 ) { return false; } - s = w.toNewHampshire( t12, false, true ).toString(); + s = w.toNewHampshire( t12, true ).toString(); if ( !s.equals( "((A2,A3),B1,(C1,C2));" ) ) { return false; } @@ -3475,7 +3697,7 @@ public final class Test { if ( t12.getNumberOfExternalNodes() != 4 ) { return false; } - s = w.toNewHampshire( t12, false, true ).toString(); + s = w.toNewHampshire( t12, true ).toString(); if ( !s.equals( "((A2,A3),(C1,C2));" ) ) { return false; } @@ -3483,7 +3705,7 @@ public final class Test { if ( t12.getNumberOfExternalNodes() != 3 ) { return false; } - s = w.toNewHampshire( t12, false, true ).toString(); + s = w.toNewHampshire( t12, true ).toString(); if ( !s.equals( "(A2,(C1,C2));" ) ) { return false; } @@ -3491,7 +3713,7 @@ public final class Test { if ( t12.getNumberOfExternalNodes() != 2 ) { return false; } - s = w.toNewHampshire( t12, false, true ).toString(); + s = w.toNewHampshire( t12, true ).toString(); if ( !s.equals( "(C1,C2);" ) ) { return false; } @@ -3500,7 +3722,7 @@ public final class Test { if ( t13.getNumberOfExternalNodes() != 4 ) { return false; } - s = w.toNewHampshire( t13, false, true ).toString(); + s = w.toNewHampshire( t13, true ).toString(); if ( !s.equals( "(A,B,C,E:5.0);" ) ) { return false; } @@ -3509,7 +3731,7 @@ public final class Test { if ( t14.getNumberOfExternalNodes() != 5 ) { return false; } - s = w.toNewHampshire( t14, false, true ).toString(); + s = w.toNewHampshire( t14, true ).toString(); if ( !s.equals( "((A,B,C,D:1.1),F);" ) ) { return false; } @@ -4051,29 +4273,233 @@ public final class Test { if ( !ParserUtils.extractScientificNameFromNodeName( "BCDO2_Mus_musculus" ).equals( "Mus musculus" ) ) { return false; } - if ( !ParserUtils.extractScientificNameFromNodeName( "BCDO2_Mus_musculus_musculus" ) - .equals( "Mus musculus musculus" ) ) { + if ( !ParserUtils.extractScientificNameFromNodeName( "BCDO2 Mus musculus" ).equals( "Mus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_BCDO2" ).equals( "Mus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Mus musculus musculus BCDO2" ) + .equals( "Mus musculus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_musculus_BCDO2" ) + .equals( "Mus musculus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "BCDO2 Mus musculus musculus" ) + .equals( "Mus musculus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Bcl Mus musculus musculus" ) + .equals( "Mus musculus musculus" ) ) { + return false; + } + if ( ParserUtils.extractScientificNameFromNodeName( "vcl Mus musculus musculus" ) != null ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "could_be_anything_Mus_musculus_musculus_BCDO2" ) + .equals( "Mus musculus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "could_be_anything_Mus_musculus_musculus_Musculus" ) + .equals( "Mus musculus musculus" ) ) { + return false; + } + if ( ParserUtils.extractScientificNameFromNodeName( "could_be_anything_Mus_musculus_musculus_musculus" ) != null ) { + return false; + } + if ( ParserUtils.extractScientificNameFromNodeName( "musculus" ) != null ) { + return false; + } + if ( ParserUtils.extractScientificNameFromNodeName( "mus_musculus" ) != null ) { + return false; + } + if ( ParserUtils.extractScientificNameFromNodeName( "mus_musculus_musculus" ) != null ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_musculus_1" ) + .equals( "Mus musculus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_1" ).equals( "Mus musculus" ) ) { + return false; + } + if ( ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_bcl" ) != null ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_BCL" ).equals( "Mus musculus" ) ) { + return false; + } + if ( ParserUtils.extractScientificNameFromNodeName( "Mus musculus bcl" ) != null ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Mus musculus BCL" ).equals( "Mus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Mus musculus xBCL" ).equals( "Mus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Mus musculus x1" ).equals( "Mus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( " -XS12_Mus_musculus_12" ).equals( "Mus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( " -1234_Mus_musculus_12 affrre e" ) + .equals( "Mus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( " -1234_Mus_musculus_12_affrre_e" ) + .equals( "Mus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus" ).equals( "Mus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_musculus_2bcl2" ) + .equals( "Mus musculus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_musculus_2bcl2" ) + .equals( "Mus musculus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_musculus_bcl2" ) + .equals( "Mus musculus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_123" ).equals( "Mus musculus" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Pilostyles mexicana Mexico Breedlove 27233" ) + .equals( "Pilostyles mexicana" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia_coli_strain_K12/DH10B" ) + .equals( "Escherichia coli strain K12/DH10B" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia_coli_str_K12/DH10B" ) + .equals( "Escherichia coli str. K12/DH10B" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli str. K12/DH10B" ) + .equals( "Escherichia coli str. K12/DH10B" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Arabidopsis_lyrata_subsp_lyrata" ) + .equals( "Arabidopsis lyrata subsp. lyrata" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Arabidopsis lyrata subsp. lyrata" ) + .equals( "Arabidopsis lyrata subsp. lyrata" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Arabidopsis lyrata subsp. lyrata 395" ) + .equals( "Arabidopsis lyrata subsp. lyrata" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Arabidopsis lyrata subsp. lyrata bcl2" ) + .equals( "Arabidopsis lyrata subsp. lyrata" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Arabidopsis lyrata subsp lyrata bcl2" ) + .equals( "Arabidopsis lyrata subsp. lyrata" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Arabidopsis lyrata subspecies lyrata bcl2" ) + .equals( "Arabidopsis lyrata subspecies lyrata" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Verbascum sinuatum var. adenosepalum bcl2" ) + .equals( "Verbascum sinuatum var. adenosepalum" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli (strain K12)" ) + .equals( "Escherichia coli (strain K12)" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli (strain K12) bcl2" ) + .equals( "Escherichia coli (strain K12)" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli (str. K12)" ) + .equals( "Escherichia coli (str. K12)" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli (str K12)" ) + .equals( "Escherichia coli (str. K12)" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli (str. K12) bcl2" ) + .equals( "Escherichia coli (str. K12)" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli (var K12) bcl2" ) + .equals( "Escherichia coli (var. K12)" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli str. K-12 substr. MG1655star" ) + .equals( "Escherichia coli str. K-12 substr. MG1655star" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli str K-12 substr MG1655star" ) + .equals( "Escherichia coli str. K-12 substr. MG1655star" ) ) { + return false; + } + if ( !ParserUtils + .extractScientificNameFromNodeName( "could be anything Escherichia coli str K-12 substr MG1655star" ) + .equals( "Escherichia coli str. K-12 substr. MG1655star" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli str K-12 substr MG1655star gene1" ) + .equals( "Escherichia coli str. K-12 substr. MG1655star" ) ) { + return false; + } + if ( !ParserUtils + .extractScientificNameFromNodeName( "could be anything Escherichia coli str K-12 substr MG1655star GENE1" ) + .equals( "Escherichia coli str. K-12 substr. MG1655star" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia_coli_str_K-12_substr_MG1655star" ) + .equals( "Escherichia coli str. K-12 substr. MG1655star" ) ) { return false; } - if ( !ParserUtils.extractScientificNameFromNodeName( "BCDO2_Mus_musculus_musculus-12" ) - .equals( "Mus musculus musculus" ) ) { + if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia_coli_str_K-12_substr_MG1655star" ) + .equals( "Escherichia coli str. K-12 substr. MG1655star" ) ) { return false; } - if ( !ParserUtils.extractScientificNameFromNodeName( " -XS12_Mus_musculus-12" ).equals( "Mus musculus" ) ) { + if ( !ParserUtils.extractScientificNameFromNodeName( "Macrocera sp." ).equals( "Macrocera sp." ) ) { return false; } - if ( !ParserUtils.extractScientificNameFromNodeName( " -1234_Mus_musculus-12 affrre e" ) - .equals( "Mus musculus" ) ) { + if ( !ParserUtils.extractScientificNameFromNodeName( "Macrocera sp. 123" ).equals( "Macrocera sp." ) ) { return false; } - if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus" ).equals( "Mus musculus" ) ) { + if ( !ParserUtils.extractScientificNameFromNodeName( "Macrocera sp. K12" ).equals( "Macrocera sp." ) ) { return false; } - if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_musculus" ) - .equals( "Mus musculus musculus" ) ) { + if ( !ParserUtils.extractScientificNameFromNodeName( "something Macrocera sp. K12" ) + .equals( "Macrocera sp." ) ) { return false; } - if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_123" ).equals( "Mus musculus" ) ) { + if ( !ParserUtils.extractScientificNameFromNodeName( "Macrocera sp" ).equals( "Macrocera sp." ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Sesamum rigidum ssp merenskyanum 07 48" ) + .equals( "Sesamum rigidum subsp. merenskyanum" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Sesamum rigidum ssp. merenskyanum" ) + .equals( "Sesamum rigidum subsp. merenskyanum" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Sesamum rigidum (ssp. merenskyanum)" ) + .equals( "Sesamum rigidum (subsp. merenskyanum)" ) ) { + return false; + } + if ( !ParserUtils.extractScientificNameFromNodeName( "Sesamum rigidum (ssp merenskyanum)" ) + .equals( "Sesamum rigidum (subsp. merenskyanum)" ) ) { return false; } } @@ -5747,6 +6173,228 @@ public final class Test { return true; } + private static boolean testMsaEntropy() { + try { + final Sequence s0 = BasicSequence.createAaSequence( "a", "AAAAAAA" ); + final Sequence s1 = BasicSequence.createAaSequence( "b", "AAAIACC" ); + final Sequence s2 = BasicSequence.createAaSequence( "c", "AAIIIIF" ); + final Sequence s3 = BasicSequence.createAaSequence( "d", "AIIIVVW" ); + final List l = new ArrayList(); + l.add( s0 ); + l.add( s1 ); + l.add( s2 ); + l.add( s3 ); + final Msa msa = BasicMsa.createInstance( l ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa, 0 ) ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa, 1 ) ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa, 2 ) ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa, 3 ) ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa, 4 ) ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa, 5 ) ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa, 6 ) ); + System.out.println(); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 6, msa, 0 ) ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 6, msa, 1 ) ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 6, msa, 2 ) ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 6, msa, 3 ) ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 6, msa, 4 ) ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 6, msa, 5 ) ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 6, msa, 6 ) ); + final List l2 = new ArrayList(); + l2.add( BasicSequence.createAaSequence( "1", "AAAAAAA" ) ); + l2.add( BasicSequence.createAaSequence( "2", "AAAIACC" ) ); + l2.add( BasicSequence.createAaSequence( "3", "AAIIIIF" ) ); + l2.add( BasicSequence.createAaSequence( "4", "AIIIVVW" ) ); + l2.add( BasicSequence.createAaSequence( "5", "AAAAAAA" ) ); + l2.add( BasicSequence.createAaSequence( "6", "AAAIACC" ) ); + l2.add( BasicSequence.createAaSequence( "7", "AAIIIIF" ) ); + l2.add( BasicSequence.createAaSequence( "8", "AIIIVVW" ) ); + l2.add( BasicSequence.createAaSequence( "9", "AAAAAAA" ) ); + l2.add( BasicSequence.createAaSequence( "10", "AAAIACC" ) ); + l2.add( BasicSequence.createAaSequence( "11", "AAIIIIF" ) ); + l2.add( BasicSequence.createAaSequence( "12", "AIIIVVW" ) ); + l2.add( BasicSequence.createAaSequence( "13", "AAIIIIF" ) ); + l2.add( BasicSequence.createAaSequence( "14", "AIIIVVW" ) ); + l2.add( BasicSequence.createAaSequence( "15", "AAAAAAA" ) ); + l2.add( BasicSequence.createAaSequence( "16", "AAAIACC" ) ); + l2.add( BasicSequence.createAaSequence( "17", "AAIIIIF" ) ); + l2.add( BasicSequence.createAaSequence( "18", "AIIIVVW" ) ); + l2.add( BasicSequence.createAaSequence( "19", "AAAAAAA" ) ); + l2.add( BasicSequence.createAaSequence( "20", "AAAIACC" ) ); + l2.add( BasicSequence.createAaSequence( "21", "AAIIIIF" ) ); + l2.add( BasicSequence.createAaSequence( "22", "AIIIVVW" ) ); + final Msa msa2 = BasicMsa.createInstance( l2 ); + System.out.println(); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa2, 0 ) ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa2, 1 ) ); + System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa2, 2 ) ); + } + catch ( final Exception e ) { + e.printStackTrace( System.out ); + return false; + } + return true; + } + + private static boolean testDeleteableMsa() { + try { + final Sequence s0 = BasicSequence.createAaSequence( "a", "AAAA" ); + final Sequence s1 = BasicSequence.createAaSequence( "b", "BAAA" ); + final Sequence s2 = BasicSequence.createAaSequence( "c", "CAAA" ); + final Sequence s3 = BasicSequence.createAaSequence( "d", "DAAA" ); + final Sequence s4 = BasicSequence.createAaSequence( "e", "EAAA" ); + final Sequence s5 = BasicSequence.createAaSequence( "f", "FAAA" ); + final List l0 = new ArrayList(); + l0.add( s0 ); + l0.add( s1 ); + l0.add( s2 ); + l0.add( s3 ); + l0.add( s4 ); + l0.add( s5 ); + final DeleteableMsa dmsa0 = DeleteableMsa.createInstance( l0 ); + dmsa0.deleteRow( "b", false ); + if ( !dmsa0.getIdentifier( 1 ).equals( "c" ) ) { + return false; + } + dmsa0.deleteRow( "e", false ); + dmsa0.deleteRow( "a", false ); + dmsa0.deleteRow( "f", false ); + if ( dmsa0.getLength() != 4 ) { + return false; + } + if ( dmsa0.getNumberOfSequences() != 2 ) { + return false; + } + if ( !dmsa0.getIdentifier( 0 ).equals( "c" ) ) { + return false; + } + if ( !dmsa0.getIdentifier( 1 ).equals( "d" ) ) { + return false; + } + if ( dmsa0.getResidueAt( 0, 0 ) != 'C' ) { + return false; + } + if ( !dmsa0.getSequenceAsString( 0 ).toString().equals( "CAAA" ) ) { + return false; + } + if ( dmsa0.getColumnAt( 0 ).size() != 2 ) { + return false; + } + dmsa0.deleteRow( "c", false ); + dmsa0.deleteRow( "d", false ); + if ( dmsa0.getNumberOfSequences() != 0 ) { + return false; + } + // + final Sequence s_0 = BasicSequence.createAaSequence( "a", "--A---B-C--X----" ); + final Sequence s_1 = BasicSequence.createAaSequence( "b", "--B-----C-------" ); + final Sequence s_2 = BasicSequence.createAaSequence( "c", "--C--AB-C------Z" ); + final Sequence s_3 = BasicSequence.createAaSequence( "d", "--D--AA-C-------" ); + final Sequence s_4 = BasicSequence.createAaSequence( "e", "--E--AA-C-------" ); + final Sequence s_5 = BasicSequence.createAaSequence( "f", "--F--AB-CD--Y---" ); + final List l1 = new ArrayList(); + l1.add( s_0 ); + l1.add( s_1 ); + l1.add( s_2 ); + l1.add( s_3 ); + l1.add( s_4 ); + l1.add( s_5 ); + final DeleteableMsa dmsa1 = DeleteableMsa.createInstance( l1 ); + dmsa1.deleteGapOnlyColumns(); + dmsa1.deleteRow( "a", false ); + dmsa1.deleteRow( "f", false ); + dmsa1.deleteRow( "d", false ); + dmsa1.deleteGapOnlyColumns(); + if ( !dmsa1.getSequenceAsString( 0 ).toString().equals( "B--C-" ) ) { + return false; + } + if ( !dmsa1.getSequenceAsString( 1 ).toString().equals( "CABCZ" ) ) { + return false; + } + if ( !dmsa1.getSequenceAsString( 2 ).toString().equals( "EAAC-" ) ) { + return false; + } + dmsa1.deleteRow( "c", false ); + dmsa1.deleteGapOnlyColumns(); + final Writer w0 = new StringWriter(); + dmsa1.write( w0, MSA_FORMAT.FASTA ); + final Writer w1 = new StringWriter(); + dmsa1.write( w1, MSA_FORMAT.PHYLIP ); + if ( !dmsa1.getSequenceAsString( 0 ).toString().equals( "B--C" ) ) { + return false; + } + if ( !dmsa1.getSequenceAsString( 1 ).toString().equals( "EAAC" ) ) { + return false; + } + // + final Sequence s__0 = BasicSequence.createAaSequence( "a", "A------" ); + final Sequence s__1 = BasicSequence.createAaSequence( "b", "BB-----" ); + final Sequence s__2 = BasicSequence.createAaSequence( "c", "CCC----" ); + final Sequence s__3 = BasicSequence.createAaSequence( "d", "DDDD---" ); + final Sequence s__4 = BasicSequence.createAaSequence( "e", "EEEEE--" ); + final Sequence s__5 = BasicSequence.createAaSequence( "f", "FFFFFF-" ); + final List l2 = new ArrayList(); + l2.add( s__0 ); + l2.add( s__1 ); + l2.add( s__2 ); + l2.add( s__3 ); + l2.add( s__4 ); + l2.add( s__5 ); + final DeleteableMsa dmsa2 = DeleteableMsa.createInstance( l2 ); + dmsa2.deleteGapColumns( 0.5 ); + if ( !dmsa2.getSequenceAsString( 0 ).toString().equals( "A---" ) ) { + return false; + } + if ( !dmsa2.getSequenceAsString( 1 ).toString().equals( "BB--" ) ) { + return false; + } + if ( !dmsa2.getSequenceAsString( 2 ).toString().equals( "CCC-" ) ) { + return false; + } + dmsa2.deleteGapColumns( 0.2 ); + if ( !dmsa2.getSequenceAsString( 0 ).toString().equals( "A-" ) ) { + return false; + } + if ( !dmsa2.getSequenceAsString( 1 ).toString().equals( "BB" ) ) { + return false; + } + if ( !dmsa2.getSequenceAsString( 2 ).toString().equals( "CC" ) ) { + return false; + } + dmsa2.deleteGapColumns( 0 ); + dmsa2.deleteRow( "a", false ); + dmsa2.deleteRow( "b", false ); + dmsa2.deleteRow( "f", false ); + dmsa2.deleteRow( "e", false ); + dmsa2.setIdentifier( 0, "new_c" ); + dmsa2.setIdentifier( 1, "new_d" ); + dmsa2.setResidueAt( 0, 0, 'x' ); + final Sequence s = dmsa2.deleteRow( "new_d", true ); + if ( !s.getMolecularSequenceAsString().equals( "D" ) ) { + return false; + } + final Writer w = new StringWriter(); + dmsa2.write( w, MSA_FORMAT.PHYLIP ); + final String phylip = w.toString(); + if ( !phylip.equals( "1 1" + ForesterUtil.LINE_SEPARATOR + "new_c x" + ForesterUtil.LINE_SEPARATOR ) ) { + System.out.println( phylip ); + return false; + } + final Writer w2 = new StringWriter(); + dmsa2.write( w2, MSA_FORMAT.FASTA ); + final String fasta = w2.toString(); + if ( !fasta.equals( ">new_c" + ForesterUtil.LINE_SEPARATOR + "x" + ForesterUtil.LINE_SEPARATOR ) ) { + System.out.println( fasta ); + return false; + } + } + catch ( final Exception e ) { + e.printStackTrace( System.out ); + return false; + } + return true; + } + private static boolean testNextNodeWithCollapsing() { try { final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance(); @@ -6629,6 +7277,35 @@ public final class Test { if ( phylogenies[ 17 ].getNumberOfExternalNodes() != 10 ) { return false; } + final NexusPhylogeniesParser p2 = new NexusPhylogeniesParser(); + phylogenies = null; + phylogenies = factory.create( Test.PATH_TO_TEST_DATA + "S15613.nex", p2 ); + if ( phylogenies.length != 9 ) { + return false; + } + if ( !isEqual( 0.48039661496919533, phylogenies[ 0 ].getNode( "Diadocidia_spinosula" ) + .getDistanceToParent() ) ) { + return false; + } + if ( !isEqual( 0.3959796191512233, phylogenies[ 0 ].getNode( "Diadocidia_stanfordensis" ) + .getDistanceToParent() ) ) { + return false; + } + if ( !phylogenies[ 0 ].getName().equals( "Family Diadocidiidae MLT (Imported_tree_0)" ) ) { + return false; + } + if ( !phylogenies[ 1 ].getName().equals( "Family Diadocidiidae BAT (con_50_majrule)" ) ) { + return false; + } + if ( !phylogenies[ 2 ].getName().equals( "Family Diadocidiidae BAT (con_50_majrule)" ) ) { + return false; + } + if ( !isEqual( 0.065284, phylogenies[ 7 ].getNode( "Bradysia_amoena" ).getDistanceToParent() ) ) { + return false; + } + if ( !isEqual( 0.065284, phylogenies[ 8 ].getNode( "Bradysia_amoena" ).getDistanceToParent() ) ) { + return false; + } } catch ( final Exception e ) { e.printStackTrace( System.out ); @@ -6727,7 +7404,7 @@ public final class Test { if ( phy != null ) { return false; } - //// + // p.setSource( Test.PATH_TO_TEST_DATA + "nexus_test_3.nex" ); if ( !p.hasNext() ) { return false; @@ -6774,15 +7451,12 @@ public final class Test { if ( phy != null ) { return false; } - //// + // p.setSource( Test.PATH_TO_TEST_DATA + "nexus_test_4_1.nex" ); - // if ( phylogenies.length != 18 ) { - // return false; - // } - //0 if ( !p.hasNext() ) { return false; } + //0 phy = p.next(); if ( phy == null ) { return false; @@ -6816,6 +7490,7 @@ public final class Test { return false; } if ( phy.getNumberOfExternalNodes() != 3 ) { + System.out.println( phy.toString() ); return false; } if ( !phy.getName().equals( "" ) ) { @@ -7193,6 +7868,82 @@ public final class Test { if ( phy.isRooted() ) { return false; } + // + final NexusPhylogeniesParser p2 = new NexusPhylogeniesParser(); + p2.setSource( Test.PATH_TO_TEST_DATA + "S15613.nex" ); + // 0 + if ( !p2.hasNext() ) { + return false; + } + phy = p2.next(); + if ( !isEqual( 0.48039661496919533, phy.getNode( "Diadocidia_spinosula" ).getDistanceToParent() ) ) { + return false; + } + if ( !isEqual( 0.3959796191512233, phy.getNode( "Diadocidia_stanfordensis" ).getDistanceToParent() ) ) { + return false; + } + // 1 + if ( !p2.hasNext() ) { + return false; + } + phy = p2.next(); + // 2 + if ( !p2.hasNext() ) { + return false; + } + phy = p2.next(); + // 3 + if ( !p2.hasNext() ) { + return false; + } + phy = p2.next(); + // 4 + if ( !p2.hasNext() ) { + return false; + } + phy = p2.next(); + // 5 + if ( !p2.hasNext() ) { + return false; + } + phy = p2.next(); + // 6 + if ( !p2.hasNext() ) { + return false; + } + phy = p2.next(); + // 7 + if ( !p2.hasNext() ) { + return false; + } + phy = p2.next(); + // 8 + if ( !p2.hasNext() ) { + return false; + } + phy = p2.next(); + if ( !isEqual( 0.065284, phy.getNode( "Bradysia_amoena" ).getDistanceToParent() ) ) { + return false; + } + if ( p2.hasNext() ) { + return false; + } + phy = p2.next(); + if ( phy != null ) { + return false; + } + // 0 + p2.reset(); + if ( !p2.hasNext() ) { + return false; + } + phy = p2.next(); + if ( !isEqual( 0.48039661496919533, phy.getNode( "Diadocidia_spinosula" ).getDistanceToParent() ) ) { + return false; + } + if ( !isEqual( 0.3959796191512233, phy.getNode( "Diadocidia_stanfordensis" ).getDistanceToParent() ) ) { + return false; + } } catch ( final Exception e ) { e.printStackTrace( System.out ); @@ -7349,6 +8100,14 @@ public final class Test { .equals( "Aranaeus" ) ) { return false; } + phylogenies = factory.create( Test.PATH_TO_TEST_DATA + "S14117.nex", parser ); + if ( phylogenies.length != 3 ) { + return false; + } + if ( !isEqual( phylogenies[ 2 ].getNode( "Aloysia lycioides 251-76-02169" ).getDistanceToParent(), + 0.00100049 ) ) { + return false; + } } catch ( final Exception e ) { e.printStackTrace( System.out ); @@ -7368,10 +8127,10 @@ public final class Test { nhxp.setTaxonomyExtraction( NHXParser.TAXONOMY_EXTRACTION.NO ); nhxp.setReplaceUnderscores( true ); final Phylogeny uc0 = factory.create( "(A__A_,_B_B)", nhxp )[ 0 ]; - if ( !uc0.getRoot().getChildNode( 0 ).getName().equals( "A A " ) ) { + if ( !uc0.getRoot().getChildNode( 0 ).getName().equals( "A A" ) ) { return false; } - if ( !uc0.getRoot().getChildNode( 1 ).getName().equals( " B B" ) ) { + if ( !uc0.getRoot().getChildNode( 1 ).getName().equals( "B B" ) ) { return false; } final Phylogeny p1b = factory @@ -7662,14 +8421,14 @@ public final class Test { if ( p50.getNode( "A" ) == null ) { return false; } - if ( !p50.toNewHampshire( false, NH_CONVERSION_SUPPORT_VALUE_STYLE.IN_SQUARE_BRACKETS ) + if ( !p50.toNewHampshire( NH_CONVERSION_SUPPORT_VALUE_STYLE.IN_SQUARE_BRACKETS ) .equals( "((A,B)ab:2.0[88],C);" ) ) { return false; } - if ( !p50.toNewHampshire( false, NH_CONVERSION_SUPPORT_VALUE_STYLE.NONE ).equals( "((A,B)ab:2.0,C);" ) ) { + if ( !p50.toNewHampshire( NH_CONVERSION_SUPPORT_VALUE_STYLE.NONE ).equals( "((A,B)ab:2.0,C);" ) ) { return false; } - if ( !p50.toNewHampshire( false, NH_CONVERSION_SUPPORT_VALUE_STYLE.AS_INTERNAL_NODE_NAMES ) + if ( !p50.toNewHampshire( NH_CONVERSION_SUPPORT_VALUE_STYLE.AS_INTERNAL_NODE_NAMES ) .equals( "((A,B)88:2.0,C);" ) ) { return false; } @@ -7687,13 +8446,63 @@ public final class Test { if ( p53.getNode( "B (x (a' ,b) f(x);" ) == null ) { return false; } - // final Phylogeny p54 = factory.create( new StringBuffer( "((A,B):[88],C)" ), new NHXParser() )[ 0 ]; if ( p54.getNode( "A" ) == null ) { return false; } - if ( !p54.toNewHampshire( false, NH_CONVERSION_SUPPORT_VALUE_STYLE.IN_SQUARE_BRACKETS ) - .equals( "((A,B)[88],C);" ) ) { + if ( !p54.toNewHampshire( NH_CONVERSION_SUPPORT_VALUE_STYLE.IN_SQUARE_BRACKETS ).equals( "((A,B)[88],C);" ) ) { + return false; + } + final Phylogeny p55 = factory + .create( new StringBuffer( "((\"lcl|HPV32_L1.:1 s\":0.195593,\"lcl|HPV30_L1.1|;a\":0.114237):0.0359322,\"lcl|HPV56_L1.1|,d\":0.0727412,\"lcl|HPV66_L1.1x\":0.0798012);" ), + new NHXParser() )[ 0 ]; + if ( !p55 + .toNewHampshire() + .equals( "(('lcl|HPV32_L1.:1 s':0.195593,'lcl|HPV30_L1.1|;a':0.114237):0.0359322,'lcl|HPV56_L1.1|,d':0.0727412,lcl|HPV66_L1.1x:0.0798012);" ) ) { + System.out.println( p55.toNewHampshire() ); + return false; + } + final Phylogeny p56 = factory + .create( new StringBuffer( "((\"lcl|HPV32_L1.:1 s\":0.195593,\"lcl|HPV30_L1.1|;a\":0.114\n237):0.0359322,\"lcl|HPV56_L1.1|,d\":0.0727412,\"lcl|HPV66_L1.1:x\":0.0798012);" ), + new NHXParser() )[ 0 ]; + if ( !p56 + .toNewHampshire() + .equals( "(('lcl|HPV32_L1.:1 s':0.195593,'lcl|HPV30_L1.1|;a':0.114237):0.0359322,'lcl|HPV56_L1.1|,d':0.0727412,'lcl|HPV66_L1.1:x':0.0798012);" ) ) { + System.out.println( p56.toNewHampshire() ); + return false; + } + final Phylogeny p57 = factory + .create( new StringBuffer( "((\"lcl|HPV32_L1.:1 s\":0.195593,\"lcl|HPV30_L1.1|;a\":0.114\n237):0.0359322,\"lcl|HPV56_L1.1|,d\":0.0727412,\"lcl|HPV66_L1.1:x\":0.0798012);" ), + new NHXParser() )[ 0 ]; + if ( !p57 + .toNewHampshire() + .equals( "(('lcl|HPV32_L1.:1 s':0.195593,'lcl|HPV30_L1.1|;a':0.114237):0.0359322,'lcl|HPV56_L1.1|,d':0.0727412,'lcl|HPV66_L1.1:x':0.0798012);" ) ) { + System.out.println( p56.toNewHampshire() ); + return false; + } + final String s58 = "('Homo \"man\" sapiens:1',\"Homo 'man' sapiens;\")';root \"1_ )';"; + final Phylogeny p58 = factory.create( new StringBuffer( s58 ), new NHXParser() )[ 0 ]; + if ( !p58.toNewHampshire().equals( s58 ) ) { + System.out.println( p58.toNewHampshire() ); + return false; + } + final String s59 = "('Homo \"man sapiens:1',\"Homo 'man sapiens\")\"root; '1_ )\";"; + final Phylogeny p59 = factory.create( new StringBuffer( s59 ), new NHXParser() )[ 0 ]; + if ( !p59.toNewHampshire().equals( s59 ) ) { + System.out.println( p59.toNewHampshire() ); + return false; + } + final String s60 = "('\" ;,:\":\"',\"'abc def' g's_\",'=:0.45+,.:%~`!@#$%^&*()_-+={} | ;,');"; + final Phylogeny p60 = factory.create( new StringBuffer( s60 ), new NHXParser() )[ 0 ]; + if ( !p60.toNewHampshire().equals( s60 ) ) { + System.out.println( p60.toNewHampshire() ); + return false; + } + final String s61 = "('H[omo] \"man\" sapiens:1',\"H[omo] 'man' sapiens;\",H[omo] sapiens)';root \"1_ )';"; + final Phylogeny p61 = factory.create( new StringBuffer( s61 ), new NHXParser() )[ 0 ]; + if ( !p61.toNewHampshire() + .equals( "('H{omo} \"man\" sapiens:1',\"H{omo} 'man' sapiens;\",Hsapiens)';root \"1_ )';" ) ) { + System.out.println( p61.toNewHampshire() ); return false; } } @@ -8184,6 +8993,14 @@ public final class Test { System.out.println( n6.toNewHampshireX() ); return false; } + final PhylogenyNode n7 = new PhylogenyNode(); + n7.setName( " gks:dr-m4 \" ' `@:[]sadq04 " ); + if ( !n7.toNewHampshire( true, PhylogenyNode.NH_CONVERSION_SUPPORT_VALUE_STYLE.IN_SQUARE_BRACKETS ) + .equals( "'gks:dr-m4 \" ` `@:[]sadq04'" ) ) { + System.out.println( n7 + .toNewHampshire( true, PhylogenyNode.NH_CONVERSION_SUPPORT_VALUE_STYLE.IN_SQUARE_BRACKETS ) ); + return false; + } } catch ( final Exception e ) { e.printStackTrace( System.out ); @@ -8620,6 +9437,12 @@ public final class Test { if ( !p10.toNewHampshireX().equals( "((A:0.2,B:0.3):0.5[&&NHX:B=91],C:0.1)root:0.1[&&NHX:B=100]" ) ) { return false; } + final Phylogeny p11 = factory + .create( " [79] ( ('A: \" ' [co mment] :0 .2[comment],B:0.3[com])[com ment]: 0. 5 \t[ 9 1 ][ comment],C: 0.1)[comment]root:0.1[100] [comment]", + new NHXParser() )[ 0 ]; + if ( !p11.toNewHampshireX().equals( "(('A: \"':0.2,B:0.3):0.5[&&NHX:B=91],C:0.1)root:0.1[&&NHX:B=100]" ) ) { + return false; + } } catch ( final Exception e ) { e.printStackTrace( System.out ); @@ -8710,13 +9533,13 @@ public final class Test { if ( phy.getNodes( "'single quotes' inside double quotes" ).size() != 1 ) { return false; } - if ( phy.getNodes( "double quotes inside single quotes" ).size() != 1 ) { + if ( phy.getNodes( "\"double quotes\" inside single quotes" ).size() != 1 ) { return false; } if ( phy.getNodes( "noquotes" ).size() != 1 ) { return false; } - if ( phy.getNodes( "A ( B C '" ).size() != 1 ) { + if ( phy.getNodes( "A ( B C '" ).size() != 1 ) { return false; } final NHXParser p1p = new NHXParser(); @@ -8746,7 +9569,7 @@ public final class Test { final Phylogeny p10 = factory .create( " [79] ( (\"A \n\tB \" [co mment] :0 .2[comment],'B':0.3[com])[com ment]: 0. 5 \t[ 9 1 ][ comment],'C (or D?\\//;,))': 0.1)[comment]'\nroot is here (cool, was! ) ':0.1[100] [comment]", new NHXParser() )[ 0 ]; - final String p10_clean_str = "(('A B':0.2,B:0.3):0.5[&&NHX:B=91],'C (or D?\\//;,))':0.1)'root is here (cool, was! )':0.1[&&NHX:B=100]"; + final String p10_clean_str = "(('A B':0.2,B:0.3):0.5[&&NHX:B=91],'C (or D?\\//;,))':0.1)'root is here (cool, was! )':0.1[&&NHX:B=100]"; if ( !p10.toNewHampshireX().equals( p10_clean_str ) ) { return false; } @@ -8754,11 +9577,10 @@ public final class Test { if ( !p11.toNewHampshireX().equals( p10_clean_str ) ) { return false; } - // final Phylogeny p12 = factory .create( " [79] ( (\"A \n\tB \" [[][] :0 .2[comment][\t&\t&\n N\tH\tX:S=mo\tnkey !],'\tB\t\b\t\n\f\rB B ':0.0\b3[])\t[com ment]: 0. 5 \t[ 9 1 ][ \ncomment],'C\t (or D?\\//;,))': 0.\b1)[comment]'\nroot \tis here (cool, \b\t\n\f\r was! ) ':0.1[100] [comment]", new NHXParser() )[ 0 ]; - final String p12_clean_str = "(('A B':0.2[&&NHX:S=monkey!],'BB B':0.03):0.5[&&NHX:B=91],'C (or D?\\//;,))':0.1)'root is here (cool, was! )':0.1[&&NHX:B=100]"; + final String p12_clean_str = "(('A B':0.2[&&NHX:S=monkey!],'BB B':0.03):0.5[&&NHX:B=91],'C (or D?\\//;,))':0.1)'root is here (cool, was! )':0.1[&&NHX:B=100]"; if ( !p12.toNewHampshireX().equals( p12_clean_str ) ) { return false; } @@ -8766,7 +9588,7 @@ public final class Test { if ( !p13.toNewHampshireX().equals( p12_clean_str ) ) { return false; } - final String p12_clean_str_nh = "(('A B':0.2,'BB B':0.03):0.5,'C (or D?\\//;,))':0.1)'root is here (cool, was! )':0.1;"; + final String p12_clean_str_nh = "(('A B':0.2,'BB B':0.03):0.5,'C (or D?\\//;,))':0.1)'root is here (cool, was! )':0.1;"; if ( !p13.toNewHampshire().equals( p12_clean_str_nh ) ) { return false; } @@ -10502,7 +11324,6 @@ public final class Test { } return false; } - // id = SequenceAccessionTools.parseAccessorFromString( "segmented worms|gb_ADF31344" ); if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() ) || !id.getValue().equals( "ADF31344" ) || !id.getSource().equals( "ncbi" ) ) { @@ -10512,7 +11333,6 @@ public final class Test { } return false; } - // id = SequenceAccessionTools.parseAccessorFromString( "segmented worms gb_ADF31344 and more" ); if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() ) || !id.getValue().equals( "ADF31344" ) || !id.getSource().equals( "ncbi" ) ) { @@ -10522,7 +11342,6 @@ public final class Test { } return false; } - // id = SequenceAccessionTools.parseAccessorFromString( "gb_AAA96518_1" ); if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() ) || !id.getValue().equals( "AAA96518" ) || !id.getSource().equals( "ncbi" ) ) { @@ -10532,7 +11351,6 @@ public final class Test { } return false; } - // id = SequenceAccessionTools.parseAccessorFromString( "gb_EHB07727_1_rodents_" ); if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() ) || !id.getValue().equals( "EHB07727" ) || !id.getSource().equals( "ncbi" ) ) { @@ -10542,7 +11360,6 @@ public final class Test { } return false; } - // id = SequenceAccessionTools.parseAccessorFromString( "dbj_BAF37827_1_turtles_" ); if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() ) || !id.getValue().equals( "BAF37827" ) || !id.getSource().equals( "ncbi" ) ) { @@ -10552,7 +11369,6 @@ public final class Test { } return false; } - // id = SequenceAccessionTools.parseAccessorFromString( "emb_CAA73223_1_primates_" ); if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() ) || !id.getValue().equals( "CAA73223" ) || !id.getSource().equals( "ncbi" ) ) { @@ -10562,7 +11378,6 @@ public final class Test { } return false; } - // id = SequenceAccessionTools.parseAccessorFromString( "mites|ref_XP_002434188_1" ); if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() ) || !id.getValue().equals( "XP_002434188" ) || !id.getSource().equals( "refseq" ) ) { @@ -10572,7 +11387,6 @@ public final class Test { } return false; } - // id = SequenceAccessionTools.parseAccessorFromString( "mites_ref_XP_002434188_1_bla_XP_12345" ); if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() ) || !id.getValue().equals( "XP_002434188" ) || !id.getSource().equals( "refseq" ) ) { @@ -10582,7 +11396,6 @@ public final class Test { } return false; } - // id = SequenceAccessionTools.parseAccessorFromString( "P4A123" ); if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() ) || !id.getValue().equals( "P4A123" ) || !id.getSource().equals( "uniprot" ) ) { @@ -10598,6 +11411,40 @@ public final class Test { System.out.println( "provider=" + id.getSource() ); return false; } + // + id = SequenceAccessionTools.parseAccessorFromString( "N3B004Z009" ); + if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() ) + || !id.getValue().equals( "N3B004Z009" ) || !id.getSource().equals( "uniprot" ) ) { + if ( id != null ) { + System.out.println( "value =" + id.getValue() ); + System.out.println( "provider=" + id.getSource() ); + } + return false; + } + id = SequenceAccessionTools.parseAccessorFromString( "A4CAA4ZBB9" ); + if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() ) + || !id.getValue().equals( "A4CAA4ZBB9" ) || !id.getSource().equals( "uniprot" ) ) { + if ( id != null ) { + System.out.println( "value =" + id.getValue() ); + System.out.println( "provider=" + id.getSource() ); + } + return false; + } + id = SequenceAccessionTools.parseAccessorFromString( "ecoli_A4CAA4ZBB9_rt" ); + if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() ) + || !id.getValue().equals( "A4CAA4ZBB9" ) || !id.getSource().equals( "uniprot" ) ) { + if ( id != null ) { + System.out.println( "value =" + id.getValue() ); + System.out.println( "provider=" + id.getSource() ); + } + return false; + } + id = SequenceAccessionTools.parseAccessorFromString( "Q4CAA4ZBB9" ); + if ( id != null ) { + System.out.println( "value =" + id.getValue() ); + System.out.println( "provider=" + id.getSource() ); + return false; + } } catch ( final Exception e ) { e.printStackTrace( System.out ); @@ -11664,6 +12511,98 @@ public final class Test { System.out.println( n13.toString() ); return false; } + final PhylogenyNode n14 = PhylogenyNode + .createInstanceFromNhxString( "Mus_musculus_392", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE ); + if ( !n14.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus" ) ) { + System.out.println( n14.toString() ); + return false; + } + final PhylogenyNode n15 = PhylogenyNode + .createInstanceFromNhxString( "Mus_musculus_K392", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE ); + if ( !n15.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus" ) ) { + System.out.println( n15.toString() ); + return false; + } + final PhylogenyNode n16 = PhylogenyNode + .createInstanceFromNhxString( "Mus musculus 392", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE ); + if ( !n16.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus" ) ) { + System.out.println( n16.toString() ); + return false; + } + final PhylogenyNode n17 = PhylogenyNode + .createInstanceFromNhxString( "Mus musculus K392", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE ); + if ( !n17.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus" ) ) { + System.out.println( n17.toString() ); + return false; + } + // + final PhylogenyNode n18 = PhylogenyNode + .createInstanceFromNhxString( "Mus_musculus_musculus_392", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE ); + if ( !n18.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus musculus" ) ) { + System.out.println( n18.toString() ); + return false; + } + final PhylogenyNode n19 = PhylogenyNode + .createInstanceFromNhxString( "Mus_musculus_musculus_K392", + NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE ); + if ( !n19.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus musculus" ) ) { + System.out.println( n19.toString() ); + return false; + } + final PhylogenyNode n20 = PhylogenyNode + .createInstanceFromNhxString( "Mus musculus musculus 392", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE ); + if ( !n20.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus musculus" ) ) { + System.out.println( n20.toString() ); + return false; + } + final PhylogenyNode n21 = PhylogenyNode + .createInstanceFromNhxString( "Mus musculus musculus K392", + NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE ); + if ( !n21.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus musculus" ) ) { + System.out.println( n21.toString() ); + return false; + } + final PhylogenyNode n22 = PhylogenyNode + .createInstanceFromNhxString( "NEMVE_Nematostella_vectensis", + NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE ); + if ( !n22.getNodeData().getTaxonomy().getTaxonomyCode().equals( "NEMVE" ) ) { + System.out.println( n22.toString() ); + return false; + } + final PhylogenyNode n23 = PhylogenyNode + .createInstanceFromNhxString( "9EMVE_Nematostella_vectensis", + NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE ); + if ( !n23.getNodeData().getTaxonomy().getScientificName().equals( "Nematostella vectensis" ) ) { + System.out.println( n23.toString() ); + return false; + } + final PhylogenyNode n24 = PhylogenyNode + .createInstanceFromNhxString( "9EMVE_Nematostella", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE ); + if ( !n24.getNodeData().getTaxonomy().getTaxonomyCode().equals( "9EMVE" ) ) { + System.out.println( n24.toString() ); + return false; + } + // + final PhylogenyNode n25 = PhylogenyNode + .createInstanceFromNhxString( "Nematostella_vectensis_NEMVE", + NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE ); + if ( !n25.getNodeData().getTaxonomy().getTaxonomyCode().equals( "NEMVE" ) ) { + System.out.println( n25.toString() ); + return false; + } + final PhylogenyNode n26 = PhylogenyNode + .createInstanceFromNhxString( "Nematostella_vectensis_9EMVE", + NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE ); + if ( !n26.getNodeData().getTaxonomy().getScientificName().equals( "Nematostella vectensis" ) ) { + System.out.println( n26.toString() ); + return false; + } + final PhylogenyNode n27 = PhylogenyNode + .createInstanceFromNhxString( "Nematostella_9EMVE", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE ); + if ( !n27.getNodeData().getTaxonomy().getTaxonomyCode().equals( "9EMVE" ) ) { + System.out.println( n27.toString() ); + return false; + } } catch ( final Exception e ) { e.printStackTrace( System.out );