// FORESTER -- software libraries and applications
// for evolutionary biology research and applications.
//
-// Copyright (C) 2008-2009 Christian M. Zmasek
-// Copyright (C) 2008-2009 Burnham Institute for Medical Research
+// Copyright (C) 2014 Christian M. Zmasek
+// Copyright (C) 2014 Sanford-Burnham Medical Research Institute
// All rights reserved
//
// This library is free software; you can redistribute it and/or
// License along with this library; if not, write to the Free Software
// Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
//
-// Contact: phylosoft @ gmail . com
// WWW: https://sites.google.com/site/cmzmasek/home/software/forester
package org.forester.test;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
+import java.io.StringWriter;
+import java.io.Writer;
+import java.net.URL;
import java.util.ArrayList;
import java.util.Date;
import java.util.HashSet;
import java.util.List;
import java.util.Locale;
import java.util.Set;
+import java.util.SortedSet;
import org.forester.application.support_transfer;
import org.forester.archaeopteryx.AptxUtil;
+import org.forester.archaeopteryx.TreePanelUtil;
+import org.forester.archaeopteryx.webservices.WebserviceUtil;
import org.forester.development.DevelopmentTools;
import org.forester.evoinference.TestPhylogenyReconstruction;
import org.forester.evoinference.matrix.character.CharacterStateMatrix;
import org.forester.io.writers.PhylogenyWriter;
import org.forester.io.writers.SequenceWriter;
import org.forester.msa.BasicMsa;
+import org.forester.msa.DeleteableMsa;
import org.forester.msa.Mafft;
import org.forester.msa.Msa;
+import org.forester.msa.Msa.MSA_FORMAT;
import org.forester.msa.MsaInferrer;
import org.forester.msa.MsaMethods;
import org.forester.pccx.TestPccx;
import org.forester.phylogeny.PhylogenyNode;
import org.forester.phylogeny.PhylogenyNode.NH_CONVERSION_SUPPORT_VALUE_STYLE;
import org.forester.phylogeny.data.Accession;
+import org.forester.phylogeny.data.Accession.Source;
import org.forester.phylogeny.data.BinaryCharacters;
import org.forester.phylogeny.data.BranchWidth;
import org.forester.phylogeny.data.Confidence;
import org.forester.protein.BasicDomain;
import org.forester.protein.BasicProtein;
import org.forester.protein.Domain;
-import org.forester.protein.DomainId;
import org.forester.protein.Protein;
import org.forester.protein.ProteinId;
import org.forester.rio.TestRIO;
import org.forester.sdi.SDIR;
import org.forester.sdi.TestGSDI;
import org.forester.sequence.BasicSequence;
-import org.forester.sequence.Sequence;
+import org.forester.sequence.MolecularSequence;
import org.forester.species.BasicSpecies;
import org.forester.species.Species;
import org.forester.surfacing.TestSurfacing;
import org.forester.util.ForesterConstants;
import org.forester.util.ForesterUtil;
import org.forester.util.GeneralTable;
-import org.forester.util.SequenceIdParser;
+import org.forester.util.SequenceAccessionTools;
import org.forester.ws.seqdb.SequenceDatabaseEntry;
import org.forester.ws.seqdb.SequenceDbWsTools;
import org.forester.ws.seqdb.UniProtTaxonomy;
@SuppressWarnings( "unused")
public final class Test {
- private final static double ZERO_DIFF = 1.0E-9;
- private final static String PATH_TO_TEST_DATA = System.getProperty( "user.dir" )
- + ForesterUtil.getFileSeparator() + "test_data"
- + ForesterUtil.getFileSeparator();
private final static String PATH_TO_RESOURCES = System.getProperty( "user.dir" )
- + ForesterUtil.getFileSeparator() + "resources"
- + ForesterUtil.getFileSeparator();
- private final static boolean USE_LOCAL_PHYLOXML_SCHEMA = true;
- private static final String PHYLOXML_REMOTE_XSD = ForesterConstants.PHYLO_XML_LOCATION + "/"
- + ForesterConstants.PHYLO_XML_VERSION + "/"
- + ForesterConstants.PHYLO_XML_XSD;
+ + ForesterUtil.getFileSeparator() + "resources"
+ + ForesterUtil.getFileSeparator();
+ private final static String PATH_TO_TEST_DATA = System.getProperty( "user.dir" )
+ + ForesterUtil.getFileSeparator() + "test_data"
+ + ForesterUtil.getFileSeparator();
+ private final static boolean PERFORM_DB_TESTS = true;
+ private static final boolean PERFORM_WEB_TREE_ACCESS = true;
private static final String PHYLOXML_LOCAL_XSD = PATH_TO_RESOURCES + "phyloxml_schema/"
- + ForesterConstants.PHYLO_XML_VERSION + "/"
- + ForesterConstants.PHYLO_XML_XSD;
+ + ForesterConstants.PHYLO_XML_VERSION + "/"
+ + ForesterConstants.PHYLO_XML_XSD;
+ private static final String PHYLOXML_REMOTE_XSD = ForesterConstants.PHYLO_XML_LOCATION + "/"
+ + ForesterConstants.PHYLO_XML_VERSION + "/"
+ + ForesterConstants.PHYLO_XML_XSD;
+ private final static boolean USE_LOCAL_PHYLOXML_SCHEMA = true;
+ private final static double ZERO_DIFF = 1.0E-9;
public static boolean isEqual( final double a, final double b ) {
return ( ( Math.abs( a - b ) ) < Test.ZERO_DIFF );
public static void main( final String[] args ) {
System.out.println( "[Java version: " + ForesterUtil.JAVA_VERSION + " " + ForesterUtil.JAVA_VENDOR + "]" );
System.out.println( "[OS: " + ForesterUtil.OS_NAME + " " + ForesterUtil.OS_ARCH + " " + ForesterUtil.OS_VERSION
- + "]" );
+ + "]" );
Locale.setDefault( Locale.US );
System.out.println( "[Locale: " + Locale.getDefault() + "]" );
int failed = 0;
System.exit( -1 );
}
final long start_time = new Date().getTime();
- System.out.print( "Domain id: " );
- if ( !testDomainId() ) {
- System.out.println( "failed." );
- failed++;
+ System.out.print( "Basic node methods: " );
+ if ( Test.testBasicNodeMethods() ) {
+ System.out.println( "OK." );
+ succeeded++;
}
else {
- succeeded++;
+ System.out.println( "failed." );
+ failed++;
}
- System.out.println( "OK." );
System.out.print( "Protein id: " );
if ( !testProteinId() ) {
System.out.println( "failed." );
System.out.println( "failed." );
failed++;
}
+ System.out.print( "UniProtKB id extraction: " );
+ if ( Test.testExtractUniProtKbProteinSeqIdentifier() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
+ System.out.print( "Sequence DB tools 1: " );
+ if ( testSequenceDbWsTools1() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
System.out.print( "Hmmscan output parser: " );
if ( testHmmscanOutputParser() ) {
System.out.println( "OK." );
System.out.println( "failed." );
failed++;
}
- System.out.print( "Basic node methods: " );
- if ( Test.testBasicNodeMethods() ) {
+ System.out.print( "Overlap removal: " );
+ if ( !org.forester.test.Test.testOverlapRemoval() ) {
+ System.out.println( "failed." );
+ failed++;
+ }
+ else {
+ succeeded++;
+ }
+ System.out.println( "OK." );
+ System.out.print( "Engulfing overlap removal: " );
+ if ( !Test.testEngulfingOverlapRemoval() ) {
+ System.out.println( "failed." );
+ failed++;
+ }
+ else {
+ succeeded++;
+ }
+ System.out.println( "OK." );
+ System.out.print( "Taxonomy data extraction: " );
+ if ( Test.testExtractTaxonomyDataFromNodeName() ) {
System.out.println( "OK." );
succeeded++;
}
System.out.println( "failed." );
failed++;
}
- System.out.print( "UniProtKB id extraction: " );
- if ( Test.testExtractUniProtKbProteinSeqIdentifier() ) {
- System.out.println( "OK." );
- succeeded++;
- }
- else {
- System.out.println( "failed." );
- failed++;
- }
System.out.print( "Uri for Aptx web sequence accession: " );
if ( Test.testCreateUriForSeqWeb() ) {
System.out.println( "OK." );
System.out.println( "failed." );
failed++;
}
+ System.out.print( "Tree copy: " );
+ if ( Test.testTreeCopy() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
System.out.print( "Basic tree methods: " );
if ( Test.testBasicTreeMethods() ) {
System.out.println( "OK." );
System.out.println( "failed." );
failed++;
}
- System.out.print( "EMBL Entry Retrieval: " );
- if ( Test.testEmblEntryRetrieval() ) {
- System.out.println( "OK." );
- succeeded++;
- }
- else {
- System.out.println( "failed." );
- failed++;
- }
- System.out.print( "Uniprot Entry Retrieval: " );
- if ( Test.testUniprotEntryRetrieval() ) {
- System.out.println( "OK." );
- succeeded++;
- }
- else {
- System.out.println( "failed." );
- failed++;
- }
- System.out.print( "Uniprot Taxonomy Search: " );
- if ( Test.testUniprotTaxonomySearch() ) {
+ System.out.print( "Genbank accessor parsing: " );
+ if ( Test.testGenbankAccessorParsing() ) {
System.out.println( "OK." );
succeeded++;
}
System.out.println( "failed." );
failed++;
}
- //----
String path = "";
final String os = ForesterUtil.OS_NAME.toLowerCase();
if ( ( os.indexOf( "mac" ) >= 0 ) && ( os.indexOf( "os" ) > 0 ) ) {
path = "C:\\Program Files\\mafft-win\\mafft.bat";
}
else {
- path = "/home/czmasek/bin/mafft";
- }
- if ( !MsaInferrer.isInstalled( path ) ) {
path = "mafft";
- }
- if ( !MsaInferrer.isInstalled( path ) ) {
- path = "/usr/local/bin/mafft";
+ if ( !MsaInferrer.isInstalled( path ) ) {
+ path = "/usr/bin/mafft";
+ }
+ if ( !MsaInferrer.isInstalled( path ) ) {
+ path = "/usr/local/bin/mafft";
+ }
}
if ( MsaInferrer.isInstalled( path ) ) {
System.out.print( "MAFFT (external program): " );
System.out.println( "failed [will not count towards failed tests]" );
}
}
- //----
System.out.print( "Next nodes with collapsed: " );
if ( Test.testNextNodeWithCollapsing() ) {
System.out.println( "OK." );
System.out.println( "failed." );
failed++;
}
+ System.out.print( "Deleteable MSA: " );
+ if ( Test.testDeleteableMsa() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
+ System.out.print( "MSA entropy: " );
+ if ( Test.testMsaEntropy() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
+ if ( PERFORM_DB_TESTS ) {
+ System.out.print( "Uniprot Entry Retrieval: " );
+ if ( Test.testUniprotEntryRetrieval() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
+ System.out.print( "Ebi Entry Retrieval: " );
+ if ( Test.testEbiEntryRetrieval() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
+ System.out.print( "Sequence DB tools 2: " );
+ if ( testSequenceDbWsTools2() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ System.exit( -1 );
+ }
+ System.out.print( "Uniprot Taxonomy Search: " );
+ if ( Test.testUniprotTaxonomySearch() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
+ }
+ if ( PERFORM_WEB_TREE_ACCESS ) {
+ System.out.print( "NHX parsing from URL: " );
+ if ( Test.testNHXparsingFromURL() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
+ System.out.print( "NHX parsing from URL 2: " );
+ if ( Test.testNHXparsingFromURL2() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
+ System.out.print( "phyloXML parsing from URL: " );
+ if ( Test.testPhyloXMLparsingFromURL() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
+ System.out.print( "TreeBase acccess: " );
+ if ( Test.testTreeBaseReading() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
+ //
+ System.out.print( "ToL access: " );
+ if ( Test.testToLReading() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
+ //
+ System.out.print( "TreeFam access: " );
+ if ( Test.testTreeFamReading() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
+ //
+ //
+ System.out.print( "Pfam tree access: " );
+ if ( Test.testPfamTreeReading() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
+ }
System.out.println();
final Runtime rt = java.lang.Runtime.getRuntime();
final long free_memory = rt.freeMemory() / 1000000;
}
}
- private final static Phylogeny createPhylogeny( final String nhx ) throws IOException {
- final Phylogeny p = ParserBasedPhylogenyFactory.getInstance().create( nhx, new NHXParser() )[ 0 ];
- return p;
- }
-
- private final static Event getEvent( final Phylogeny p, final String n1, final String n2 ) {
- return PhylogenyMethods.calculateLCA( p.getNode( n1 ), p.getNode( n2 ) ).getNodeData().getEvent();
- }
-
- private static boolean testAminoAcidSequence() {
+ public static boolean testEngulfingOverlapRemoval() {
try {
- final Sequence aa1 = BasicSequence.createAaSequence( "aa1", "aAklm-?xX*z$#" );
- if ( aa1.getLength() != 13 ) {
- return false;
- }
- if ( aa1.getResidueAt( 0 ) != 'A' ) {
- return false;
- }
- if ( aa1.getResidueAt( 2 ) != 'K' ) {
- return false;
- }
- if ( !new String( aa1.getMolecularSequence() ).equals( "AAKLM-XXX*ZXX" ) ) {
+ final Domain d0 = new BasicDomain( "d0", 0, 8, ( short ) 1, ( short ) 1, 0.1, 1 );
+ final Domain d1 = new BasicDomain( "d1", 0, 1, ( short ) 1, ( short ) 1, 0.1, 1 );
+ final Domain d2 = new BasicDomain( "d2", 0, 2, ( short ) 1, ( short ) 1, 0.1, 1 );
+ final Domain d3 = new BasicDomain( "d3", 7, 8, ( short ) 1, ( short ) 1, 0.1, 1 );
+ final Domain d4 = new BasicDomain( "d4", 7, 9, ( short ) 1, ( short ) 1, 0.1, 1 );
+ final Domain d5 = new BasicDomain( "d4", 0, 9, ( short ) 1, ( short ) 1, 0.1, 1 );
+ final Domain d6 = new BasicDomain( "d4", 4, 5, ( short ) 1, ( short ) 1, 0.1, 1 );
+ final List<Boolean> covered = new ArrayList<Boolean>();
+ covered.add( true ); // 0
+ covered.add( false ); // 1
+ covered.add( true ); // 2
+ covered.add( false ); // 3
+ covered.add( true ); // 4
+ covered.add( true ); // 5
+ covered.add( false ); // 6
+ covered.add( true ); // 7
+ covered.add( true ); // 8
+ if ( ForesterUtil.isEngulfed( d0, covered ) ) {
return false;
}
- final Sequence aa2 = BasicSequence.createAaSequence( "aa3", "ARNDCQEGHILKMFPSTWYVX*-BZOJU" );
- if ( !new String( aa2.getMolecularSequence() ).equals( "ARNDCQEGHILKMFPSTWYVX*-BZXXU" ) ) {
+ if ( ForesterUtil.isEngulfed( d1, covered ) ) {
return false;
}
- final Sequence dna1 = BasicSequence.createDnaSequence( "dna1", "ACGTUX*-?RYMKWSN" );
- if ( !new String( dna1.getMolecularSequence() ).equals( "ACGTNN*-NRYMKWSN" ) ) {
+ if ( ForesterUtil.isEngulfed( d2, covered ) ) {
return false;
}
- final Sequence rna1 = BasicSequence.createRnaSequence( "rna1", "..ACGUTX*-?RYMKWSN" );
- if ( !new String( rna1.getMolecularSequence() ).equals( "--ACGUNN*-NRYMKWSN" ) ) {
+ if ( !ForesterUtil.isEngulfed( d3, covered ) ) {
return false;
}
- }
- catch ( final Exception e ) {
- e.printStackTrace();
- return false;
- }
- return true;
- }
-
- private static boolean testBasicDomain() {
- try {
- final Domain pd = new BasicDomain( "id", 23, 25, ( short ) 1, ( short ) 4, 0.1, -12 );
- if ( !pd.getDomainId().getId().equals( "id" ) ) {
+ if ( ForesterUtil.isEngulfed( d4, covered ) ) {
return false;
}
- if ( pd.getNumber() != 1 ) {
+ if ( ForesterUtil.isEngulfed( d5, covered ) ) {
return false;
}
- if ( pd.getTotalCount() != 4 ) {
+ if ( !ForesterUtil.isEngulfed( d6, covered ) ) {
return false;
}
- if ( !pd.equals( new BasicDomain( "id", 22, 111, ( short ) 1, ( short ) 4, 0.2, -12 ) ) ) {
+ final Domain a = new BasicDomain( "a", 0, 10, ( short ) 1, ( short ) 1, 0.1, 1 );
+ final Domain b = new BasicDomain( "b", 8, 20, ( short ) 1, ( short ) 1, 0.2, 1 );
+ final Domain c = new BasicDomain( "c", 15, 16, ( short ) 1, ( short ) 1, 0.3, 1 );
+ final Protein abc = new BasicProtein( "abc", "nemve", 0 );
+ abc.addProteinDomain( a );
+ abc.addProteinDomain( b );
+ abc.addProteinDomain( c );
+ final Protein abc_r1 = ForesterUtil.removeOverlappingDomains( 3, false, abc );
+ final Protein abc_r2 = ForesterUtil.removeOverlappingDomains( 3, true, abc );
+ if ( abc.getNumberOfProteinDomains() != 3 ) {
return false;
}
- final Domain a1 = new BasicDomain( "a", 1, 10, ( short ) 1, ( short ) 4, 0.1, -12 );
- final BasicDomain a1_copy = new BasicDomain( "a", 1, 10, ( short ) 1, ( short ) 4, 0.1, -12 );
- final BasicDomain a1_equal = new BasicDomain( "a", 524, 743994, ( short ) 1, ( short ) 300, 3.0005, 230 );
- final BasicDomain a2 = new BasicDomain( "a", 1, 10, ( short ) 2, ( short ) 4, 0.1, -12 );
- final BasicDomain a3 = new BasicDomain( "A", 1, 10, ( short ) 1, ( short ) 4, 0.1, -12 );
- if ( !a1.equals( a1 ) ) {
+ if ( abc_r1.getNumberOfProteinDomains() != 3 ) {
return false;
}
- if ( !a1.equals( a1_copy ) ) {
+ if ( abc_r2.getNumberOfProteinDomains() != 2 ) {
return false;
}
- if ( !a1.equals( a1_equal ) ) {
+ if ( !abc_r2.getProteinDomain( 0 ).getDomainId().equals( "a" ) ) {
return false;
}
- if ( !a1.equals( a2 ) ) {
+ if ( !abc_r2.getProteinDomain( 1 ).getDomainId().equals( "b" ) ) {
return false;
}
- if ( a1.equals( a3 ) ) {
+ final Domain d = new BasicDomain( "d", 0, 10, ( short ) 1, ( short ) 1, 0.1, 1 );
+ final Domain e = new BasicDomain( "e", 8, 20, ( short ) 1, ( short ) 1, 0.3, 1 );
+ final Domain f = new BasicDomain( "f", 15, 16, ( short ) 1, ( short ) 1, 0.2, 1 );
+ final Protein def = new BasicProtein( "def", "nemve", 0 );
+ def.addProteinDomain( d );
+ def.addProteinDomain( e );
+ def.addProteinDomain( f );
+ final Protein def_r1 = ForesterUtil.removeOverlappingDomains( 5, false, def );
+ final Protein def_r2 = ForesterUtil.removeOverlappingDomains( 5, true, def );
+ if ( def.getNumberOfProteinDomains() != 3 ) {
return false;
}
- if ( a1.compareTo( a1 ) != 0 ) {
+ if ( def_r1.getNumberOfProteinDomains() != 3 ) {
return false;
}
- if ( a1.compareTo( a1_copy ) != 0 ) {
+ if ( def_r2.getNumberOfProteinDomains() != 3 ) {
return false;
}
- if ( a1.compareTo( a1_equal ) != 0 ) {
+ if ( !def_r2.getProteinDomain( 0 ).getDomainId().equals( "d" ) ) {
return false;
}
- if ( a1.compareTo( a2 ) != 0 ) {
+ if ( !def_r2.getProteinDomain( 1 ).getDomainId().equals( "f" ) ) {
return false;
}
- if ( a1.compareTo( a3 ) != 0 ) {
+ if ( !def_r2.getProteinDomain( 2 ).getDomainId().equals( "e" ) ) {
return false;
}
}
return true;
}
- private static boolean testBasicNodeMethods() {
+ public static final boolean testNHXparsingFromURL2() {
try {
- if ( PhylogenyNode.getNodeCount() != 0 ) {
+ final String s = "https://sites.google.com/site/cmzmasek/home/software/archaeopteryx/examples/simple/simple_1.nh";
+ final Phylogeny phys[] = AptxUtil.readPhylogeniesFromUrl( new URL( s ),
+ false,
+ false,
+ false,
+ TAXONOMY_EXTRACTION.NO,
+ false );
+ if ( ( phys == null ) || ( phys.length != 5 ) ) {
return false;
}
- final PhylogenyNode n1 = new PhylogenyNode();
- final PhylogenyNode n2 = PhylogenyNode
- .createInstanceFromNhxString( "", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_STRICT );
- final PhylogenyNode n3 = PhylogenyNode
- .createInstanceFromNhxString( "n3", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_STRICT );
- final PhylogenyNode n4 = PhylogenyNode
- .createInstanceFromNhxString( "n4:0.01", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_STRICT );
- if ( n1.isHasAssignedEvent() ) {
+ if ( !phys[ 0 ].toNewHampshire().equals( "((((A,B),C),D),(E,F));" ) ) {
+ System.out.println( phys[ 0 ].toNewHampshire() );
return false;
}
- if ( PhylogenyNode.getNodeCount() != 4 ) {
+ if ( !phys[ 1 ].toNewHampshire().equals( "((1,2,3),(4,5,6),(7,8,9));" ) ) {
+ System.out.println( phys[ 1 ].toNewHampshire() );
return false;
}
- if ( n3.getIndicator() != 0 ) {
+ final Phylogeny phys2[] = AptxUtil.readPhylogeniesFromUrl( new URL( s ),
+ false,
+ false,
+ false,
+ TAXONOMY_EXTRACTION.NO,
+ false );
+ if ( ( phys2 == null ) || ( phys2.length != 5 ) ) {
return false;
}
- if ( n3.getNumberOfExternalNodes() != 1 ) {
+ if ( !phys2[ 0 ].toNewHampshire().equals( "((((A,B),C),D),(E,F));" ) ) {
+ System.out.println( phys2[ 0 ].toNewHampshire() );
return false;
}
- if ( !n3.isExternal() ) {
+ if ( !phys2[ 1 ].toNewHampshire().equals( "((1,2,3),(4,5,6),(7,8,9));" ) ) {
+ System.out.println( phys2[ 1 ].toNewHampshire() );
return false;
}
- if ( !n3.isRoot() ) {
+ final Phylogeny phys3[] = AptxUtil.readPhylogeniesFromUrl( new URL( "http://swisstree.vital-it.ch:80/"
+ + "SwissTree/ST001/consensus_tree.nhx" ), false, false, false, TAXONOMY_EXTRACTION.NO, false );
+ if ( ( phys3 == null ) || ( phys3.length != 1 ) ) {
return false;
}
- if ( !n4.getName().equals( "n4" ) ) {
+ if ( !phys3[ 0 ]
+ .toNewHampshire()
+ .equals( "((((POP23a_CIOIN_ENSCING00000016202,POP23b_CIOIN_ENSCING00000016169),POP23_CIOSA_ENSCSAVG00000000248),((POP23a_BRAFL_C3ZMF1,POP23b_BRAFL_121417),(((POP3_ORYLA_ENSORLG00000019669,POP3_GASAC_ENSGACG00000014023,POP3_DANRE_Q6JWW1),(POP3_XENTR_B1H1F6,(POP3_CHICK_Q9DG25,(POP3_ORNAN_ENSOANG00000004179,POP3_MONDO_ENSMODG00000018033,((POP3_MOUSE_Q9ES81,POP3_RAT_Q3BCU3),POP3_RABIT_ENSOCUG00000025973,POP3_MACMU_ENSMMUG00000014473,POP3_HUMAN_Q9HBV1))))),(((POP2_GASAC_ENSGACG00000001420,POP2_ORYLA_ENSORLG00000008627,POP2_TAKRU_ENSTRUG00000015933),POP2_DANRE_ENSDARG00000069922),POP2_XENTR_ENSXETG00000018064,(((POP2_TAEGU_ENSTGUG00000013383,POP2_CHICK_Q6T9Z5),POP2_ANOCA_ENSACAG00000003557),((POP2_MACEU_ENSMEUG00000015825,POP2_MONDO_ENSMODG00000018205),((POP2_RABIT_ENSOCUG00000009515,(POP2_RAT_Q6P722,POP2_MOUSE_Q9ES82)),(POP2_MACMU_ENSMMUG00000000905,POP2_HUMAN_Q9HBU9)))))))),((POP1_CIOSA_ENSCSAVG00000000247,POP1_CIOIN_ENSCING00000000496),((POP1_DANRE_Q5PQZ7,(POP1_ORYLA_ENSORLG00000019663,POP1_GASAC_ENSGACG00000014015,POP1_TAKRU_ENSORLG00000019663)),(POP1_XENTR_B1H1G2,(POP1_ANOCA_ENSACAG00000003910,(POP1_TAEGU_ENSTGUG00000012218,POP1_CHICK_Q9DG23)),POP1_ORNAN_ENSOANG00000004180,POP1_MONDO_ENSMODG00000018034,(POP1_RABIT_ENSOCUG00000016944,(POP1_RAT_Q3BCU4,POP1_MOUSE_Q9ES83),(POP1_HUMAN_Q8NE79,POP1_MACMU_ENSMMUG00000014471))))));" ) ) {
+ System.out.println( phys3[ 0 ].toNewHampshire() );
+ return false;
+ }
+ final Phylogeny phys4[] = AptxUtil.readPhylogeniesFromUrl( new URL( "http://swisstree.vital-it.ch:80/"
+ + "SwissTree/ST001/consensus_tree.nhx" ), false, false, false, TAXONOMY_EXTRACTION.NO, false );
+ if ( ( phys4 == null ) || ( phys4.length != 1 ) ) {
+ return false;
+ }
+ if ( !phys4[ 0 ]
+ .toNewHampshire()
+ .equals( "((((POP23a_CIOIN_ENSCING00000016202,POP23b_CIOIN_ENSCING00000016169),POP23_CIOSA_ENSCSAVG00000000248),((POP23a_BRAFL_C3ZMF1,POP23b_BRAFL_121417),(((POP3_ORYLA_ENSORLG00000019669,POP3_GASAC_ENSGACG00000014023,POP3_DANRE_Q6JWW1),(POP3_XENTR_B1H1F6,(POP3_CHICK_Q9DG25,(POP3_ORNAN_ENSOANG00000004179,POP3_MONDO_ENSMODG00000018033,((POP3_MOUSE_Q9ES81,POP3_RAT_Q3BCU3),POP3_RABIT_ENSOCUG00000025973,POP3_MACMU_ENSMMUG00000014473,POP3_HUMAN_Q9HBV1))))),(((POP2_GASAC_ENSGACG00000001420,POP2_ORYLA_ENSORLG00000008627,POP2_TAKRU_ENSTRUG00000015933),POP2_DANRE_ENSDARG00000069922),POP2_XENTR_ENSXETG00000018064,(((POP2_TAEGU_ENSTGUG00000013383,POP2_CHICK_Q6T9Z5),POP2_ANOCA_ENSACAG00000003557),((POP2_MACEU_ENSMEUG00000015825,POP2_MONDO_ENSMODG00000018205),((POP2_RABIT_ENSOCUG00000009515,(POP2_RAT_Q6P722,POP2_MOUSE_Q9ES82)),(POP2_MACMU_ENSMMUG00000000905,POP2_HUMAN_Q9HBU9)))))))),((POP1_CIOSA_ENSCSAVG00000000247,POP1_CIOIN_ENSCING00000000496),((POP1_DANRE_Q5PQZ7,(POP1_ORYLA_ENSORLG00000019663,POP1_GASAC_ENSGACG00000014015,POP1_TAKRU_ENSORLG00000019663)),(POP1_XENTR_B1H1G2,(POP1_ANOCA_ENSACAG00000003910,(POP1_TAEGU_ENSTGUG00000012218,POP1_CHICK_Q9DG23)),POP1_ORNAN_ENSOANG00000004180,POP1_MONDO_ENSMODG00000018034,(POP1_RABIT_ENSOCUG00000016944,(POP1_RAT_Q3BCU4,POP1_MOUSE_Q9ES83),(POP1_HUMAN_Q8NE79,POP1_MACMU_ENSMMUG00000014471))))));" ) ) {
+ System.out.println( phys4[ 0 ].toNewHampshire() );
return false;
}
}
catch ( final Exception e ) {
- e.printStackTrace( System.out );
+ e.printStackTrace();
return false;
}
return true;
}
- private static boolean testBasicPhyloXMLparsing() {
+ public static final boolean testNHXparsingFromURL() {
try {
+ final String s = "https://sites.google.com/site/cmzmasek/home/software/archaeopteryx/examples/simple/simple_1.nh";
+ final URL u = new URL( s );
final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance();
- final PhyloXmlParser xml_parser = new PhyloXmlParser();
- final Phylogeny[] phylogenies_0 = factory.create( Test.PATH_TO_TEST_DATA + "phyloxml_test_t1.xml",
- xml_parser );
- if ( xml_parser.getErrorCount() > 0 ) {
- System.out.println( xml_parser.getErrorMessages().toString() );
+ final Phylogeny[] phys = factory.create( u, new NHXParser() );
+ if ( ( phys == null ) || ( phys.length != 5 ) ) {
return false;
}
- if ( phylogenies_0.length != 4 ) {
+ if ( !phys[ 0 ].toNewHampshire().equals( "((((A,B),C),D),(E,F));" ) ) {
+ System.out.println( phys[ 0 ].toNewHampshire() );
return false;
}
- final Phylogeny t1 = phylogenies_0[ 0 ];
- final Phylogeny t2 = phylogenies_0[ 1 ];
- final Phylogeny t3 = phylogenies_0[ 2 ];
- final Phylogeny t4 = phylogenies_0[ 3 ];
- if ( t1.getNumberOfExternalNodes() != 1 ) {
+ if ( !phys[ 1 ].toNewHampshire().equals( "((1,2,3),(4,5,6),(7,8,9));" ) ) {
+ System.out.println( phys[ 1 ].toNewHampshire() );
return false;
}
- if ( !t1.isRooted() ) {
+ final URL u2 = new URL( s );
+ final Phylogeny[] phys2 = factory.create( u2.openStream(), new NHXParser() );
+ if ( ( phys2 == null ) || ( phys2.length != 5 ) ) {
return false;
}
- if ( t1.isRerootable() ) {
+ if ( !phys2[ 0 ].toNewHampshire().equals( "((((A,B),C),D),(E,F));" ) ) {
+ System.out.println( phys2[ 0 ].toNewHampshire() );
return false;
}
- if ( !t1.getType().equals( "gene_tree" ) ) {
+ final PhylogenyFactory factory2 = ParserBasedPhylogenyFactory.getInstance();
+ final NHXParser p = new NHXParser();
+ final URL u3 = new URL( s );
+ p.setSource( u3 );
+ if ( !p.hasNext() ) {
return false;
}
- if ( t2.getNumberOfExternalNodes() != 2 ) {
+ if ( !p.next().toNewHampshire().equals( "((((A,B),C),D),(E,F));" ) ) {
return false;
}
- if ( !isEqual( t2.getNode( "node a" ).getDistanceToParent(), 1.0 ) ) {
+ if ( !p.hasNext() ) {
return false;
}
- if ( !isEqual( t2.getNode( "node b" ).getDistanceToParent(), 2.0 ) ) {
- return false;
+ p.reset();
+ if ( !p.hasNext() ) {
+ return false;
+ }
+ if ( !p.next().toNewHampshire().equals( "((((A,B),C),D),(E,F));" ) ) {
+ return false;
+ }
+ if ( !p.next().toNewHampshire().equals( "((1,2,3),(4,5,6),(7,8,9));" ) ) {
+ return false;
+ }
+ p.reset();
+ if ( !p.hasNext() ) {
+ return false;
+ }
+ if ( !p.next().toNewHampshire().equals( "((((A,B),C),D),(E,F));" ) ) {
+ return false;
+ }
+ if ( !p.next().toNewHampshire().equals( "((1,2,3),(4,5,6),(7,8,9));" ) ) {
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ System.out.println( e.toString() );
+ e.printStackTrace();
+ return false;
+ }
+ return true;
+ }
+
+ public static boolean testOverlapRemoval() {
+ try {
+ final Domain d0 = new BasicDomain( "d0", ( short ) 2, ( short ) 5, ( short ) 1, ( short ) 1, 0.1, 1 );
+ final Domain d1 = new BasicDomain( "d1", ( short ) 7, ( short ) 10, ( short ) 1, ( short ) 1, 0.1, 1 );
+ final Domain d2 = new BasicDomain( "d2", ( short ) 0, ( short ) 20, ( short ) 1, ( short ) 1, 0.1, 1 );
+ final Domain d3 = new BasicDomain( "d3", ( short ) 9, ( short ) 10, ( short ) 1, ( short ) 1, 0.1, 1 );
+ final Domain d4 = new BasicDomain( "d4", ( short ) 7, ( short ) 8, ( short ) 1, ( short ) 1, 0.1, 1 );
+ final List<Boolean> covered = new ArrayList<Boolean>();
+ covered.add( true ); // 0
+ covered.add( false ); // 1
+ covered.add( true ); // 2
+ covered.add( false ); // 3
+ covered.add( true ); // 4
+ covered.add( true ); // 5
+ covered.add( false ); // 6
+ covered.add( true ); // 7
+ covered.add( true ); // 8
+ if ( ForesterUtil.calculateOverlap( d0, covered ) != 3 ) {
+ return false;
+ }
+ if ( ForesterUtil.calculateOverlap( d1, covered ) != 2 ) {
+ return false;
+ }
+ if ( ForesterUtil.calculateOverlap( d2, covered ) != 6 ) {
+ return false;
+ }
+ if ( ForesterUtil.calculateOverlap( d3, covered ) != 0 ) {
+ return false;
+ }
+ if ( ForesterUtil.calculateOverlap( d4, covered ) != 2 ) {
+ return false;
+ }
+ final Domain a = new BasicDomain( "a", ( short ) 2, ( short ) 5, ( short ) 1, ( short ) 1, 1, -1 );
+ final Domain b = new BasicDomain( "b", ( short ) 2, ( short ) 10, ( short ) 1, ( short ) 1, 0.1, -1 );
+ final Protein ab = new BasicProtein( "ab", "varanus", 0 );
+ ab.addProteinDomain( a );
+ ab.addProteinDomain( b );
+ final Protein ab_s0 = ForesterUtil.removeOverlappingDomains( 3, false, ab );
+ if ( ab.getNumberOfProteinDomains() != 2 ) {
+ return false;
+ }
+ if ( ab_s0.getNumberOfProteinDomains() != 1 ) {
+ return false;
+ }
+ if ( !ab_s0.getProteinDomain( 0 ).getDomainId().equals( "b" ) ) {
+ return false;
+ }
+ final Protein ab_s1 = ForesterUtil.removeOverlappingDomains( 4, false, ab );
+ if ( ab.getNumberOfProteinDomains() != 2 ) {
+ return false;
+ }
+ if ( ab_s1.getNumberOfProteinDomains() != 2 ) {
+ return false;
+ }
+ final Domain c = new BasicDomain( "c", ( short ) 20000, ( short ) 20500, ( short ) 1, ( short ) 1, 10, 1 );
+ final Domain d = new BasicDomain( "d",
+ ( short ) 10000,
+ ( short ) 10500,
+ ( short ) 1,
+ ( short ) 1,
+ 0.0000001,
+ 1 );
+ final Domain e = new BasicDomain( "e", ( short ) 5000, ( short ) 5500, ( short ) 1, ( short ) 1, 0.0001, 1 );
+ final Protein cde = new BasicProtein( "cde", "varanus", 0 );
+ cde.addProteinDomain( c );
+ cde.addProteinDomain( d );
+ cde.addProteinDomain( e );
+ final Protein cde_s0 = ForesterUtil.removeOverlappingDomains( 0, false, cde );
+ if ( cde.getNumberOfProteinDomains() != 3 ) {
+ return false;
+ }
+ if ( cde_s0.getNumberOfProteinDomains() != 3 ) {
+ return false;
+ }
+ final Domain f = new BasicDomain( "f", ( short ) 10, ( short ) 20, ( short ) 1, ( short ) 1, 10, 1 );
+ final Domain g = new BasicDomain( "g", ( short ) 10, ( short ) 20, ( short ) 1, ( short ) 1, 0.01, 1 );
+ final Domain h = new BasicDomain( "h", ( short ) 10, ( short ) 20, ( short ) 1, ( short ) 1, 0.0001, 1 );
+ final Domain i = new BasicDomain( "i", ( short ) 10, ( short ) 20, ( short ) 1, ( short ) 1, 0.5, 1 );
+ final Domain i2 = new BasicDomain( "i", ( short ) 5, ( short ) 30, ( short ) 1, ( short ) 1, 0.5, 10 );
+ final Protein fghi = new BasicProtein( "fghi", "varanus", 0 );
+ fghi.addProteinDomain( f );
+ fghi.addProteinDomain( g );
+ fghi.addProteinDomain( h );
+ fghi.addProteinDomain( i );
+ fghi.addProteinDomain( i );
+ fghi.addProteinDomain( i );
+ fghi.addProteinDomain( i2 );
+ final Protein fghi_s0 = ForesterUtil.removeOverlappingDomains( 10, false, fghi );
+ if ( fghi.getNumberOfProteinDomains() != 7 ) {
+ return false;
+ }
+ if ( fghi_s0.getNumberOfProteinDomains() != 1 ) {
+ return false;
+ }
+ if ( !fghi_s0.getProteinDomain( 0 ).getDomainId().equals( "h" ) ) {
+ return false;
+ }
+ final Protein fghi_s1 = ForesterUtil.removeOverlappingDomains( 11, false, fghi );
+ if ( fghi.getNumberOfProteinDomains() != 7 ) {
+ return false;
+ }
+ if ( fghi_s1.getNumberOfProteinDomains() != 7 ) {
+ return false;
+ }
+ final Domain j = new BasicDomain( "j", ( short ) 10, ( short ) 20, ( short ) 1, ( short ) 1, 10, 1 );
+ final Domain k = new BasicDomain( "k", ( short ) 10, ( short ) 20, ( short ) 1, ( short ) 1, 0.01, 1 );
+ final Domain l = new BasicDomain( "l", ( short ) 10, ( short ) 20, ( short ) 1, ( short ) 1, 0.0001, 1 );
+ final Domain m = new BasicDomain( "m", ( short ) 10, ( short ) 20, ( short ) 1, ( short ) 4, 0.5, 1 );
+ final Domain m0 = new BasicDomain( "m", ( short ) 10, ( short ) 20, ( short ) 2, ( short ) 4, 0.5, 1 );
+ final Domain m1 = new BasicDomain( "m", ( short ) 10, ( short ) 20, ( short ) 3, ( short ) 4, 0.5, 1 );
+ final Domain m2 = new BasicDomain( "m", ( short ) 5, ( short ) 30, ( short ) 4, ( short ) 4, 0.5, 10 );
+ final Protein jklm = new BasicProtein( "jklm", "varanus", 0 );
+ jklm.addProteinDomain( j );
+ jklm.addProteinDomain( k );
+ jklm.addProteinDomain( l );
+ jklm.addProteinDomain( m );
+ jklm.addProteinDomain( m0 );
+ jklm.addProteinDomain( m1 );
+ jklm.addProteinDomain( m2 );
+ final Protein jklm_s0 = ForesterUtil.removeOverlappingDomains( 10, false, jklm );
+ if ( jklm.getNumberOfProteinDomains() != 7 ) {
+ return false;
+ }
+ if ( jklm_s0.getNumberOfProteinDomains() != 1 ) {
+ return false;
+ }
+ if ( !jklm_s0.getProteinDomain( 0 ).getDomainId().equals( "l" ) ) {
+ return false;
+ }
+ final Protein jklm_s1 = ForesterUtil.removeOverlappingDomains( 11, false, jklm );
+ if ( jklm.getNumberOfProteinDomains() != 7 ) {
+ return false;
+ }
+ if ( jklm_s1.getNumberOfProteinDomains() != 7 ) {
+ return false;
+ }
+ final Domain only = new BasicDomain( "only", ( short ) 5, ( short ) 30, ( short ) 4, ( short ) 4, 0.5, 10 );
+ final Protein od = new BasicProtein( "od", "varanus", 0 );
+ od.addProteinDomain( only );
+ final Protein od_s0 = ForesterUtil.removeOverlappingDomains( 0, false, od );
+ if ( od.getNumberOfProteinDomains() != 1 ) {
+ return false;
+ }
+ if ( od_s0.getNumberOfProteinDomains() != 1 ) {
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace( System.out );
+ return false;
+ }
+ return true;
+ }
+
+ public static final boolean testPfamTreeReading() {
+ try {
+ final URL u = new URL( WebserviceUtil.PFAM_SERVER + "/family/PF" + "01849" + "/tree/download" );
+ final NHXParser parser = new NHXParser();
+ parser.setTaxonomyExtraction( NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_STRICT );
+ parser.setReplaceUnderscores( false );
+ parser.setGuessRootedness( true );
+ final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance();
+ final Phylogeny[] phys = factory.create( u.openStream(), parser );
+ if ( ( phys == null ) || ( phys.length != 1 ) ) {
+ return false;
+ }
+ if ( phys[ 0 ].getNumberOfExternalNodes() < 10 ) {
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace();
+ }
+ return true;
+ }
+
+ public static final boolean testPhyloXMLparsingFromURL() {
+ try {
+ final String s = "https://sites.google.com/site/cmzmasek/home/software/archaeopteryx/examples/archaeopteryx_a/apaf_bcl2.xml";
+ final URL u = new URL( s );
+ final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance();
+ final Phylogeny[] phys = factory.create( u.openStream(), PhyloXmlParser.createPhyloXmlParser() );
+ if ( ( phys == null ) || ( phys.length != 2 ) ) {
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace();
+ }
+ return true;
+ }
+
+ public static final boolean testToLReading() {
+ try {
+ final URL u = new URL( WebserviceUtil.TOL_URL_BASE + "15079" );
+ final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance();
+ final Phylogeny[] phys = factory.create( u.openStream(), new TolParser() );
+ if ( ( phys == null ) || ( phys.length != 1 ) ) {
+ return false;
+ }
+ if ( !phys[ 0 ].getRoot().getNodeData().getTaxonomy().getIdentifier().getValue().equals( "15079" ) ) {
+ return false;
+ }
+ if ( !phys[ 0 ].getRoot().getNodeData().getTaxonomy().getScientificName().equals( "Protacanthopterygii" ) ) {
+ return false;
+ }
+ if ( phys[ 0 ].getNumberOfExternalNodes() < 5 ) {
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace();
+ }
+ return true;
+ }
+
+ public static final boolean testTreeBaseReading() {
+ try {
+ final URL u = new URL( WebserviceUtil.TREEBASE_PHYLOWS_TREE_URL_BASE + "825?format=nexus" );
+ final NexusPhylogeniesParser parser = new NexusPhylogeniesParser();
+ parser.setReplaceUnderscores( true );
+ final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance();
+ final Phylogeny[] phys = factory.create( u.openStream(), parser );
+ if ( ( phys == null ) || ( phys.length != 1 ) ) {
+ return false;
+ }
+ final URL u2 = new URL( WebserviceUtil.TREEBASE_PHYLOWS_STUDY_URL_BASE + "15613?format=nexus" );
+ final NexusPhylogeniesParser parser2 = new NexusPhylogeniesParser();
+ parser2.setReplaceUnderscores( true );
+ final PhylogenyFactory factory2 = ParserBasedPhylogenyFactory.getInstance();
+ final Phylogeny[] phys2 = factory2.create( u2.openStream(), parser2 );
+ if ( ( phys2 == null ) || ( phys2.length != 9 ) ) {
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace();
+ }
+ return true;
+ }
+
+ public static final boolean testTreeFamReading() {
+ try {
+ final URL u = new URL( WebserviceUtil.TREE_FAM_URL_BASE + "101004" + "/tree/newick" );
+ final NHXParser parser = new NHXParser();
+ parser.setTaxonomyExtraction( NHXParser.TAXONOMY_EXTRACTION.NO );
+ parser.setReplaceUnderscores( false );
+ parser.setGuessRootedness( true );
+ final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance();
+ final Phylogeny[] phys = factory.create( u.openStream(), parser );
+ if ( ( phys == null ) || ( phys.length != 1 ) ) {
+ return false;
+ }
+ if ( phys[ 0 ].getNumberOfExternalNodes() < 10 ) {
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace();
+ }
+ return true;
+ }
+
+ private final static Phylogeny createPhylogeny( final String nhx ) throws IOException {
+ final Phylogeny p = ParserBasedPhylogenyFactory.getInstance().create( nhx, new NHXParser() )[ 0 ];
+ return p;
+ }
+
+ private final static Event getEvent( final Phylogeny p, final String n1, final String n2 ) {
+ return PhylogenyMethods.calculateLCA( p.getNode( n1 ), p.getNode( n2 ) ).getNodeData().getEvent();
+ }
+
+ private static boolean testAminoAcidSequence() {
+ try {
+ final MolecularSequence aa1 = BasicSequence.createAaSequence( "aa1", "aAklm-?xX*z$#" );
+ if ( aa1.getLength() != 13 ) {
+ return false;
+ }
+ if ( aa1.getResidueAt( 0 ) != 'A' ) {
+ return false;
+ }
+ if ( aa1.getResidueAt( 2 ) != 'K' ) {
+ return false;
+ }
+ if ( !new String( aa1.getMolecularSequence() ).equals( "AAKLM-XXX*ZXX" ) ) {
+ return false;
+ }
+ final MolecularSequence aa2 = BasicSequence.createAaSequence( "aa3", "ARNDCQEGHILKMFPSTWYVX*-BZOJU" );
+ if ( !new String( aa2.getMolecularSequence() ).equals( "ARNDCQEGHILKMFPSTWYVX*-BZOXU" ) ) {
+ return false;
+ }
+ final MolecularSequence dna1 = BasicSequence.createDnaSequence( "dna1", "ACGTUX*-?RYMKWSN" );
+ if ( !new String( dna1.getMolecularSequence() ).equals( "ACGTNN*-NRYMKWSN" ) ) {
+ return false;
+ }
+ final MolecularSequence rna1 = BasicSequence.createRnaSequence( "rna1", "..ACGUTX*-?RYMKWSN" );
+ if ( !new String( rna1.getMolecularSequence() ).equals( "--ACGUNN*-NRYMKWSN" ) ) {
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace();
+ return false;
+ }
+ return true;
+ }
+
+ private static boolean testBasicDomain() {
+ try {
+ final Domain pd = new BasicDomain( "id", 23, 25, ( short ) 1, ( short ) 4, 0.1, -12 );
+ if ( !pd.getDomainId().equals( "id" ) ) {
+ return false;
+ }
+ if ( pd.getNumber() != 1 ) {
+ return false;
+ }
+ if ( pd.getTotalCount() != 4 ) {
+ return false;
+ }
+ if ( !pd.equals( new BasicDomain( "id", 22, 111, ( short ) 1, ( short ) 4, 0.2, -12 ) ) ) {
+ return false;
+ }
+ final Domain a1 = new BasicDomain( "a", 1, 10, ( short ) 1, ( short ) 4, 0.1, -12 );
+ final BasicDomain a1_copy = new BasicDomain( "a", 1, 10, ( short ) 1, ( short ) 4, 0.1, -12 );
+ final BasicDomain a1_equal = new BasicDomain( "a", 524, 743994, ( short ) 1, ( short ) 300, 3.0005, 230 );
+ final BasicDomain a2 = new BasicDomain( "a", 1, 10, ( short ) 2, ( short ) 4, 0.1, -12 );
+ final BasicDomain a3 = new BasicDomain( "A", 1, 10, ( short ) 1, ( short ) 4, 0.1, -12 );
+ if ( !a1.equals( a1 ) ) {
+ return false;
+ }
+ if ( !a1.equals( a1_copy ) ) {
+ return false;
+ }
+ if ( !a1.equals( a1_equal ) ) {
+ return false;
+ }
+ if ( !a1.equals( a2 ) ) {
+ return false;
+ }
+ if ( a1.equals( a3 ) ) {
+ return false;
+ }
+ if ( a1.compareTo( a1 ) != 0 ) {
+ return false;
+ }
+ if ( a1.compareTo( a1_copy ) != 0 ) {
+ return false;
+ }
+ if ( a1.compareTo( a1_equal ) != 0 ) {
+ return false;
+ }
+ if ( a1.compareTo( a2 ) != 0 ) {
+ return false;
+ }
+ if ( a1.compareTo( a3 ) == 0 ) {
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace( System.out );
+ return false;
+ }
+ return true;
+ }
+
+ private static boolean testBasicNodeMethods() {
+ try {
+ if ( PhylogenyNode.getNodeCount() != 0 ) {
+ return false;
+ }
+ final PhylogenyNode n1 = new PhylogenyNode();
+ final PhylogenyNode n2 = PhylogenyNode
+ .createInstanceFromNhxString( "", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_STRICT );
+ final PhylogenyNode n3 = PhylogenyNode
+ .createInstanceFromNhxString( "n3", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_STRICT );
+ final PhylogenyNode n4 = PhylogenyNode
+ .createInstanceFromNhxString( "n4:0.01", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_STRICT );
+ if ( n1.isHasAssignedEvent() ) {
+ return false;
+ }
+ if ( PhylogenyNode.getNodeCount() != 4 ) {
+ return false;
+ }
+ if ( n3.getIndicator() != 0 ) {
+ return false;
+ }
+ if ( n3.getNumberOfExternalNodes() != 1 ) {
+ return false;
+ }
+ if ( !n3.isExternal() ) {
+ return false;
+ }
+ if ( !n3.isRoot() ) {
+ return false;
+ }
+ if ( !n4.getName().equals( "n4" ) ) {
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace( System.out );
+ return false;
+ }
+ return true;
+ }
+
+ private static boolean testBasicPhyloXMLparsing() {
+ try {
+ final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance();
+ final PhyloXmlParser xml_parser = PhyloXmlParser.createPhyloXmlParser();
+ final Phylogeny[] phylogenies_0 = factory.create( Test.PATH_TO_TEST_DATA + "phyloxml_test_t1.xml",
+ xml_parser );
+ if ( xml_parser.getErrorCount() > 0 ) {
+ System.out.println( xml_parser.getErrorMessages().toString() );
+ return false;
+ }
+ if ( phylogenies_0.length != 4 ) {
+ return false;
+ }
+ final Phylogeny t1 = phylogenies_0[ 0 ];
+ final Phylogeny t2 = phylogenies_0[ 1 ];
+ final Phylogeny t3 = phylogenies_0[ 2 ];
+ final Phylogeny t4 = phylogenies_0[ 3 ];
+ if ( t1.getNumberOfExternalNodes() != 1 ) {
+ return false;
+ }
+ if ( !t1.isRooted() ) {
+ return false;
+ }
+ if ( t1.isRerootable() ) {
+ return false;
+ }
+ if ( !t1.getType().equals( "gene_tree" ) ) {
+ return false;
+ }
+ if ( t2.getNumberOfExternalNodes() != 2 ) {
+ return false;
+ }
+ if ( !isEqual( t2.getNode( "node a" ).getDistanceToParent(), 1.0 ) ) {
+ return false;
+ }
+ if ( !isEqual( t2.getNode( "node b" ).getDistanceToParent(), 2.0 ) ) {
+ return false;
}
if ( t2.getNode( "node a" ).getNodeData().getTaxonomies().size() != 2 ) {
return false;
if ( !t3.getIdentifier().getProvider().equals( "treebank" ) ) {
return false;
}
+ if ( !t3.getNode( "root node" ).isDuplication() ) {
+ return false;
+ }
+ if ( !t3.getNode( "node a" ).isDuplication() ) {
+ return false;
+ }
+ if ( t3.getNode( "node a" ).isSpeciation() ) {
+ return false;
+ }
+ if ( t3.getNode( "node bc" ).isDuplication() ) {
+ return false;
+ }
+ if ( !t3.getNode( "node bc" ).isSpeciation() ) {
+ return false;
+ }
if ( !t3.getNode( "root node" ).getNodeData().getSequence().getType().equals( "protein" ) ) {
return false;
}
if ( !( t3.getNode( "root node" ).getNodeData().getSequence().getLocation().equals( "12p13-p12" ) ) ) {
return false;
}
+ final SortedSet<Accession> x = t3.getNode( "root node" ).getNodeData().getSequence().getCrossReferences();
+ if ( x.size() != 4 ) {
+ return false;
+ }
+ int c = 0;
+ for( final Accession acc : x ) {
+ if ( c == 0 ) {
+ if ( !acc.getSource().equals( "KEGG" ) ) {
+ return false;
+ }
+ if ( !acc.getValue().equals( "hsa:596" ) ) {
+ return false;
+ }
+ }
+ c++;
+ }
}
catch ( final Exception e ) {
e.printStackTrace( System.out );
private static boolean testBasicPhyloXMLparsingRoundtrip() {
try {
final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance();
- final PhyloXmlParser xml_parser = new PhyloXmlParser();
+ final PhyloXmlParser xml_parser = PhyloXmlParser.createPhyloXmlParser();
if ( USE_LOCAL_PHYLOXML_SCHEMA ) {
xml_parser.setValidateAgainstSchema( PHYLOXML_LOCAL_XSD );
}
return false;
}
if ( t3_rt.getNode( "node bc" ).getNodeData().getSequence().getDomainArchitecture().getDomain( 0 )
- .getConfidence() != 2144 ) {
+ .getConfidence() != 0 ) {
return false;
}
if ( !t3_rt.getNode( "node bc" ).getNodeData().getSequence().getDomainArchitecture().getDomain( 0 ).getId()
}
if ( ( ( BinaryCharacters ) t3_rt.getNode( "node bb" ).getNodeData().getBinaryCharacters().copy() )
.getLostCount() != BinaryCharacters.COUNT_DEFAULT ) {
- ;
return false;
}
if ( t3_rt.getNode( "node b" ).getNodeData().getBinaryCharacters().getGainedCount() != 1 ) {
if ( !t3_rt.getNode( "node b" ).getNodeData().getBinaryCharacters().getType().equals( "characters" ) ) {
return false;
}
- //
if ( !t3_rt.getNode( "node ba" ).getNodeData().getDate().getDesc().equals( "Silurian" ) ) {
return false;
}
.equalsIgnoreCase( "433" ) ) {
return false;
}
+ final SortedSet<Accession> x = t3_rt.getNode( "root node" ).getNodeData().getSequence()
+ .getCrossReferences();
+ if ( x.size() != 4 ) {
+ return false;
+ }
+ int c = 0;
+ for( final Accession acc : x ) {
+ if ( c == 0 ) {
+ if ( !acc.getSource().equals( "KEGG" ) ) {
+ return false;
+ }
+ if ( !acc.getValue().equals( "hsa:596" ) ) {
+ return false;
+ }
+ }
+ c++;
+ }
}
catch ( final Exception e ) {
e.printStackTrace( System.out );
// Do nothing -- means were not running from jar.
}
if ( xml_parser == null ) {
- xml_parser = new PhyloXmlParser();
+ xml_parser = PhyloXmlParser.createPhyloXmlParser();
if ( USE_LOCAL_PHYLOXML_SCHEMA ) {
xml_parser.setValidateAgainstSchema( PHYLOXML_LOCAL_XSD );
}
p.addProteinDomain( A20 );
p.addProteinDomain( B25 );
p.addProteinDomain( D80 );
- List<DomainId> domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "C" ) );
+ List<String> domains_ids = new ArrayList<String>();
+ domains_ids.add( "A" );
+ domains_ids.add( "B" );
+ domains_ids.add( "C" );
if ( !p.contains( domains_ids, false ) ) {
return false;
}
if ( !p.contains( domains_ids, true ) ) {
return false;
}
- domains_ids.add( new DomainId( "X" ) );
+ domains_ids.add( "X" );
if ( p.contains( domains_ids, false ) ) {
return false;
}
if ( p.contains( domains_ids, true ) ) {
return false;
}
- domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "D" ) );
+ domains_ids = new ArrayList<String>();
+ domains_ids.add( "A" );
+ domains_ids.add( "C" );
+ domains_ids.add( "D" );
if ( !p.contains( domains_ids, false ) ) {
return false;
}
if ( !p.contains( domains_ids, true ) ) {
return false;
}
- domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "D" ) );
- domains_ids.add( new DomainId( "C" ) );
+ domains_ids = new ArrayList<String>();
+ domains_ids.add( "A" );
+ domains_ids.add( "D" );
+ domains_ids.add( "C" );
if ( !p.contains( domains_ids, false ) ) {
return false;
}
if ( p.contains( domains_ids, true ) ) {
return false;
}
- domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- if ( !p.contains( domains_ids, false ) ) {
- return false;
- }
- if ( !p.contains( domains_ids, true ) ) {
- return false;
- }
- domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "B" ) );
+ domains_ids = new ArrayList<String>();
+ domains_ids.add( "A" );
+ domains_ids.add( "A" );
+ domains_ids.add( "B" );
if ( !p.contains( domains_ids, false ) ) {
return false;
}
if ( !p.contains( domains_ids, true ) ) {
return false;
}
- domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "B" ) );
- if ( !p.contains( domains_ids, false ) ) {
- return false;
- }
- if ( !p.contains( domains_ids, true ) ) {
- return false;
- }
- domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "B" ) );
- if ( !p.contains( domains_ids, false ) ) {
- return false;
- }
- if ( p.contains( domains_ids, true ) ) {
- return false;
- }
- domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "D" ) );
- if ( !p.contains( domains_ids, false ) ) {
- return false;
- }
- if ( !p.contains( domains_ids, true ) ) {
- return false;
- }
- domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "D" ) );
- if ( !p.contains( domains_ids, false ) ) {
- return false;
- }
- if ( !p.contains( domains_ids, true ) ) {
- return false;
- }
- domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "D" ) );
- if ( !p.contains( domains_ids, false ) ) {
- return false;
- }
- if ( p.contains( domains_ids, true ) ) {
- return false;
- }
- domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "D" ) );
- if ( !p.contains( domains_ids, false ) ) {
- return false;
- }
- if ( p.contains( domains_ids, true ) ) {
- return false;
- }
- domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "D" ) );
+ domains_ids = new ArrayList<String>();
+ domains_ids.add( "A" );
+ domains_ids.add( "A" );
+ domains_ids.add( "A" );
+ domains_ids.add( "B" );
+ domains_ids.add( "B" );
if ( !p.contains( domains_ids, false ) ) {
return false;
}
if ( !p.contains( domains_ids, true ) ) {
return false;
}
- domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "D" ) );
- domains_ids.add( new DomainId( "X" ) );
- if ( p.contains( domains_ids, false ) ) {
- return false;
- }
- if ( p.contains( domains_ids, true ) ) {
- return false;
- }
- domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "X" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "D" ) );
- if ( p.contains( domains_ids, false ) ) {
- return false;
- }
- if ( p.contains( domains_ids, true ) ) {
- return false;
- }
- domains_ids = new ArrayList<DomainId>();
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "B" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "A" ) );
- domains_ids.add( new DomainId( "C" ) );
- domains_ids.add( new DomainId( "D" ) );
+ domains_ids = new ArrayList<String>();
+ domains_ids.add( "A" );
+ domains_ids.add( "A" );
+ domains_ids.add( "B" );
+ domains_ids.add( "A" );
+ domains_ids.add( "B" );
+ domains_ids.add( "B" );
+ domains_ids.add( "A" );
+ domains_ids.add( "B" );
+ domains_ids.add( "C" );
+ domains_ids.add( "A" );
+ domains_ids.add( "C" );
+ domains_ids.add( "D" );
if ( !p.contains( domains_ids, false ) ) {
return false;
}
private static boolean testBasicTreeMethods() {
try {
final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance();
- final Phylogeny t1 = factory.create();
- if ( !t1.isEmpty() ) {
- return false;
- }
final Phylogeny t2 = factory.create( "((A:1,B:2)AB:1,(C:3,D:5)CD:3)ABCD:0.5", new NHXParser() )[ 0 ];
if ( t2.getNumberOfExternalNodes() != 4 ) {
return false;
if ( !isEqual( t_bx.getNode( "acd" ).getBranchData().getConfidence( 0 ).getValue(), 1 ) ) {
return false;
}
- //
final Phylogeny[] t2 = factory
.create( "((((a,b),c),d),e);(((a,b),c),(d,e));(((((a,b),c),d),e),f);((((a,b),c),(d,e)),f);(((a,b),c),d,e);((a,b,c),d,e);",
new NHXParser() );
for( final Phylogeny target : t2 ) {
ConfidenceAssessor.evaluate( "bootstrap", ev2, target, false, 1 );
}
- //
final Phylogeny t4 = factory.create( "((((((A,B)ab,C)abc,D)abcd,E)abcde,F)abcdef,G)abcdefg",
new NHXParser() )[ 0 ];
final Phylogeny[] ev4 = factory.create( "(((A,B),C),(X,Y));((F,G),((A,B,C),(D,E)))", new NHXParser() );
try {
final PhylogenyNode n = new PhylogenyNode();
n.setName( "tr|B3RJ64" );
- if ( !AptxUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.UNIPROT_KB + "B3RJ64" ) ) {
+ if ( !TreePanelUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.UNIPROT_KB + "B3RJ64" ) ) {
return false;
}
n.setName( "B0LM41_HUMAN" );
- if ( !AptxUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.UNIPROT_KB + "B0LM41_HUMAN" ) ) {
+ if ( !TreePanelUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.UNIPROT_KB + "B0LM41_HUMAN" ) ) {
return false;
}
n.setName( "NP_001025424" );
- if ( !AptxUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_PROTEIN + "NP_001025424" ) ) {
+ if ( !TreePanelUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_PROTEIN + "NP_001025424" ) ) {
return false;
}
n.setName( "_NM_001030253-" );
- if ( !AptxUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_NUCCORE + "NM_001030253" ) ) {
+ if ( !TreePanelUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_NUCCORE + "NM_001030253" ) ) {
return false;
}
n.setName( "XM_002122186" );
- if ( !AptxUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_NUCCORE + "XM_002122186" ) ) {
+ if ( !TreePanelUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_NUCCORE + "XM_002122186" ) ) {
return false;
}
n.setName( "dgh_AAA34956_gdg" );
- if ( !AptxUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_PROTEIN + "AAA34956" ) ) {
+ if ( !TreePanelUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_PROTEIN + "AAA34956" ) ) {
return false;
}
- n.setName( "j40f4_Q06891.1_fndn2 fnr3" );
- if ( !AptxUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_PROTEIN + "Q06891.1" ) ) {
+ n.setName( "AAA34956" );
+ if ( !TreePanelUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_PROTEIN + "AAA34956" ) ) {
return false;
}
n.setName( "GI:394892" );
- if ( !AptxUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_GI + "394892" ) ) {
- System.out.println( AptxUtil.createUriForSeqWeb( n, null, null ) );
+ if ( !TreePanelUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_GI + "394892" ) ) {
+ System.out.println( TreePanelUtil.createUriForSeqWeb( n, null, null ) );
return false;
}
n.setName( "gi_394892" );
- if ( !AptxUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_GI + "394892" ) ) {
- System.out.println( AptxUtil.createUriForSeqWeb( n, null, null ) );
+ if ( !TreePanelUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_GI + "394892" ) ) {
+ System.out.println( TreePanelUtil.createUriForSeqWeb( n, null, null ) );
return false;
}
n.setName( "gi6335_gi_394892_56635_Gi_43" );
- if ( !AptxUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_GI + "394892" ) ) {
- System.out.println( AptxUtil.createUriForSeqWeb( n, null, null ) );
+ if ( !TreePanelUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.NCBI_GI + "394892" ) ) {
+ System.out.println( TreePanelUtil.createUriForSeqWeb( n, null, null ) );
+ return false;
+ }
+ n.setName( "P12345" );
+ if ( !TreePanelUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.UNIPROT_KB + "P12345" ) ) {
+ System.out.println( TreePanelUtil.createUriForSeqWeb( n, null, null ) );
+ return false;
+ }
+ n.setName( "gi_fdgjmn-3jk5-243 mnefmn fg023-0 P12345 4395jtmnsrg02345m1ggi92450jrg890j4t0j240" );
+ if ( !TreePanelUtil.createUriForSeqWeb( n, null, null ).equals( ForesterUtil.UNIPROT_KB + "P12345" ) ) {
+ System.out.println( TreePanelUtil.createUriForSeqWeb( n, null, null ) );
return false;
}
}
if ( t4.getNumberOfExternalNodes() != 5 ) {
return false;
}
- String s = w.toNewHampshire( t4, false, true ).toString();
+ String s = w.toNewHampshire( t4, true ).toString();
if ( !s.equals( "((A,(B11,B12)),(C,D));" ) ) {
return false;
}
if ( !n.getName().equals( "D" ) ) {
return false;
}
- s = w.toNewHampshire( t4, false, true ).toString();
+ s = w.toNewHampshire( t4, true ).toString();
if ( !s.equals( "((A,B12),D);" ) ) {
return false;
}
if ( t5.getNumberOfExternalNodes() != 5 ) {
return false;
}
- s = w.toNewHampshire( t5, false, true ).toString();
+ s = w.toNewHampshire( t5, true ).toString();
if ( !s.equals( "(((B11,B12),B2),(C,D));" ) ) {
return false;
}
if ( t6.getNumberOfExternalNodes() != 5 ) {
return false;
}
- s = w.toNewHampshire( t6, false, false ).toString();
+ s = w.toNewHampshire( t6, false ).toString();
if ( !s.equals( "((A,(B12,B2)),(C,D));" ) ) {
return false;
}
if ( t7.getNumberOfExternalNodes() != 5 ) {
return false;
}
- s = w.toNewHampshire( t7, false, true ).toString();
+ s = w.toNewHampshire( t7, true ).toString();
if ( !s.equals( "((A,(B11,B2)),(C,D));" ) ) {
return false;
}
if ( t8.getNumberOfExternalNodes() != 5 ) {
return false;
}
- s = w.toNewHampshire( t8, false, false ).toString();
+ s = w.toNewHampshire( t8, false ).toString();
if ( !s.equals( "((A,(B11,B12)),(C,D));" ) ) {
return false;
}
if ( t9.getNumberOfExternalNodes() != 5 ) {
return false;
}
- s = w.toNewHampshire( t9, false, true ).toString();
+ s = w.toNewHampshire( t9, true ).toString();
if ( !s.equals( "((A,((B11,B12),B2)),D);" ) ) {
return false;
}
if ( t10.getNumberOfExternalNodes() != 5 ) {
return false;
}
- s = w.toNewHampshire( t10, false, true ).toString();
+ s = w.toNewHampshire( t10, true ).toString();
if ( !s.equals( "((A,((B11,B12),B2)),C);" ) ) {
return false;
}
if ( t11.getNumberOfExternalNodes() != 2 ) {
return false;
}
- s = w.toNewHampshire( t11, false, true ).toString();
+ s = w.toNewHampshire( t11, true ).toString();
if ( !s.equals( "(B,C);" ) ) {
return false;
}
if ( t11.getNumberOfExternalNodes() != 1 ) {
return false;
}
- s = w.toNewHampshire( t11, false, false ).toString();
+ s = w.toNewHampshire( t11, false ).toString();
if ( !s.equals( "B;" ) ) {
return false;
}
if ( t12.getNumberOfExternalNodes() != 8 ) {
return false;
}
- s = w.toNewHampshire( t12, false, true ).toString();
+ s = w.toNewHampshire( t12, true ).toString();
if ( !s.equals( "((A1,A2,A3),(B1,B3),(C1,C2,C3));" ) ) {
return false;
}
if ( t12.getNumberOfExternalNodes() != 7 ) {
return false;
}
- s = w.toNewHampshire( t12, false, true ).toString();
+ s = w.toNewHampshire( t12, true ).toString();
if ( !s.equals( "((A1,A2,A3),B1,(C1,C2,C3));" ) ) {
return false;
}
if ( t12.getNumberOfExternalNodes() != 6 ) {
return false;
}
- s = w.toNewHampshire( t12, false, true ).toString();
+ s = w.toNewHampshire( t12, true ).toString();
if ( !s.equals( "((A1,A2,A3),B1,(C1,C2));" ) ) {
return false;
}
if ( t12.getNumberOfExternalNodes() != 5 ) {
return false;
}
- s = w.toNewHampshire( t12, false, true ).toString();
+ s = w.toNewHampshire( t12, true ).toString();
if ( !s.equals( "((A2,A3),B1,(C1,C2));" ) ) {
return false;
}
if ( t12.getNumberOfExternalNodes() != 4 ) {
return false;
}
- s = w.toNewHampshire( t12, false, true ).toString();
+ s = w.toNewHampshire( t12, true ).toString();
if ( !s.equals( "((A2,A3),(C1,C2));" ) ) {
return false;
}
if ( t12.getNumberOfExternalNodes() != 3 ) {
return false;
}
- s = w.toNewHampshire( t12, false, true ).toString();
+ s = w.toNewHampshire( t12, true ).toString();
if ( !s.equals( "(A2,(C1,C2));" ) ) {
return false;
}
if ( t12.getNumberOfExternalNodes() != 2 ) {
return false;
}
- s = w.toNewHampshire( t12, false, true ).toString();
+ s = w.toNewHampshire( t12, true ).toString();
if ( !s.equals( "(C1,C2);" ) ) {
return false;
}
if ( t13.getNumberOfExternalNodes() != 4 ) {
return false;
}
- s = w.toNewHampshire( t13, false, true ).toString();
+ s = w.toNewHampshire( t13, true ).toString();
if ( !s.equals( "(A,B,C,E:5.0);" ) ) {
return false;
}
if ( t14.getNumberOfExternalNodes() != 5 ) {
return false;
}
- s = w.toNewHampshire( t14, false, true ).toString();
+ s = w.toNewHampshire( t14, true ).toString();
if ( !s.equals( "((A,B,C,D:1.1),F);" ) ) {
return false;
}
if ( bins1_2.length != 3 ) {
return false;
}
- if ( bins1_2[ 0 ] != 2 ) {
+ if ( bins1_2[ 0 ] != 2 ) {
+ return false;
+ }
+ if ( bins1_2[ 1 ] != 2 ) {
+ return false;
+ }
+ if ( bins1_2[ 2 ] != 2 ) {
+ return false;
+ }
+ final DescriptiveStatistics dss3 = new BasicDescriptiveStatistics();
+ dss3.addValue( 1 );
+ dss3.addValue( 1 );
+ dss3.addValue( 1 );
+ dss3.addValue( 2 );
+ dss3.addValue( 3 );
+ dss3.addValue( 4 );
+ dss3.addValue( 5 );
+ dss3.addValue( 5 );
+ dss3.addValue( 5 );
+ dss3.addValue( 6 );
+ dss3.addValue( 7 );
+ dss3.addValue( 8 );
+ dss3.addValue( 9 );
+ dss3.addValue( 10 );
+ dss3.addValue( 10 );
+ dss3.addValue( 10 );
+ final AsciiHistogram histo = new AsciiHistogram( dss3 );
+ histo.toStringBuffer( 10, '=', 40, 5 );
+ histo.toStringBuffer( 3, 8, 10, '=', 40, 5, null );
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace( System.out );
+ return false;
+ }
+ return true;
+ }
+
+ private static boolean testDir( final String file ) {
+ try {
+ final File f = new File( file );
+ if ( !f.exists() ) {
+ return false;
+ }
+ if ( !f.isDirectory() ) {
+ return false;
+ }
+ if ( !f.canRead() ) {
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ return false;
+ }
+ return true;
+ }
+
+ private static boolean testEbiEntryRetrieval() {
+ try {
+ final SequenceDatabaseEntry entry = SequenceDbWsTools.obtainEntry( "AAK41263" );
+ if ( !entry.getAccession().equals( "AAK41263" ) ) {
+ System.out.println( entry.getAccession() );
+ return false;
+ }
+ if ( !entry.getTaxonomyScientificName().equals( "Sulfolobus solfataricus P2" ) ) {
+ System.out.println( entry.getTaxonomyScientificName() );
+ return false;
+ }
+ if ( !entry.getSequenceName()
+ .equals( "Sulfolobus solfataricus P2 Glycogen debranching enzyme, hypothetical (treX-like)" ) ) {
+ System.out.println( entry.getSequenceName() );
+ return false;
+ }
+ if ( !entry.getGeneName().equals( "treX-like" ) ) {
+ System.out.println( entry.getGeneName() );
+ return false;
+ }
+ if ( !entry.getTaxonomyIdentifier().equals( "273057" ) ) {
+ System.out.println( entry.getTaxonomyIdentifier() );
+ return false;
+ }
+ if ( !entry.getAnnotations().first().getRefValue().equals( "3.2.1.33" ) ) {
+ System.out.println( entry.getAnnotations().first().getRefValue() );
+ return false;
+ }
+ if ( !entry.getAnnotations().first().getRefSource().equals( "EC" ) ) {
+ System.out.println( entry.getAnnotations().first().getRefSource() );
+ return false;
+ }
+ if ( entry.getCrossReferences().size() < 1 ) {
+ return false;
+ }
+ final SequenceDatabaseEntry entry1 = SequenceDbWsTools.obtainEntry( "ABJ16409" );
+ if ( !entry1.getAccession().equals( "ABJ16409" ) ) {
+ return false;
+ }
+ if ( !entry1.getTaxonomyScientificName().equals( "Felis catus" ) ) {
+ System.out.println( entry1.getTaxonomyScientificName() );
+ return false;
+ }
+ if ( !entry1.getSequenceName().equals( "Felis catus (domestic cat) partial BCL2" ) ) {
+ System.out.println( entry1.getSequenceName() );
+ return false;
+ }
+ if ( !entry1.getTaxonomyIdentifier().equals( "9685" ) ) {
+ System.out.println( entry1.getTaxonomyIdentifier() );
+ return false;
+ }
+ if ( !entry1.getGeneName().equals( "BCL2" ) ) {
+ System.out.println( entry1.getGeneName() );
+ return false;
+ }
+ if ( entry1.getCrossReferences().size() < 1 ) {
+ return false;
+ }
+ final SequenceDatabaseEntry entry2 = SequenceDbWsTools.obtainEntry( "NM_184234" );
+ if ( !entry2.getAccession().equals( "NM_184234" ) ) {
+ return false;
+ }
+ if ( !entry2.getTaxonomyScientificName().equals( "Homo sapiens" ) ) {
+ System.out.println( entry2.getTaxonomyScientificName() );
+ return false;
+ }
+ if ( !entry2.getSequenceName()
+ .equals( "Homo sapiens RNA binding motif protein 39 (RBM39), transcript variant 1, mRNA" ) ) {
+ System.out.println( entry2.getSequenceName() );
+ return false;
+ }
+ if ( !entry2.getTaxonomyIdentifier().equals( "9606" ) ) {
+ System.out.println( entry2.getTaxonomyIdentifier() );
+ return false;
+ }
+ if ( !entry2.getGeneName().equals( "RBM39" ) ) {
+ System.out.println( entry2.getGeneName() );
+ return false;
+ }
+ if ( entry2.getCrossReferences().size() < 1 ) {
+ return false;
+ }
+ if ( !entry2.getChromosome().equals( "20" ) ) {
+ return false;
+ }
+ if ( !entry2.getMap().equals( "20q11.22" ) ) {
+ return false;
+ }
+ final SequenceDatabaseEntry entry3 = SequenceDbWsTools.obtainEntry( "HM043801" );
+ if ( !entry3.getAccession().equals( "HM043801" ) ) {
return false;
}
- if ( bins1_2[ 1 ] != 2 ) {
+ if ( !entry3.getTaxonomyScientificName().equals( "Bursaphelenchus xylophilus" ) ) {
+ System.out.println( entry3.getTaxonomyScientificName() );
return false;
}
- if ( bins1_2[ 2 ] != 2 ) {
+ if ( !entry3.getSequenceName().equals( "Bursaphelenchus xylophilus RAF gene, complete cds" ) ) {
+ System.out.println( entry3.getSequenceName() );
return false;
}
- final DescriptiveStatistics dss3 = new BasicDescriptiveStatistics();
- dss3.addValue( 1 );
- dss3.addValue( 1 );
- dss3.addValue( 1 );
- dss3.addValue( 2 );
- dss3.addValue( 3 );
- dss3.addValue( 4 );
- dss3.addValue( 5 );
- dss3.addValue( 5 );
- dss3.addValue( 5 );
- dss3.addValue( 6 );
- dss3.addValue( 7 );
- dss3.addValue( 8 );
- dss3.addValue( 9 );
- dss3.addValue( 10 );
- dss3.addValue( 10 );
- dss3.addValue( 10 );
- final AsciiHistogram histo = new AsciiHistogram( dss3 );
- histo.toStringBuffer( 10, '=', 40, 5 );
- histo.toStringBuffer( 3, 8, 10, '=', 40, 5, null );
- }
- catch ( final Exception e ) {
- e.printStackTrace( System.out );
- return false;
- }
- return true;
- }
-
- private static boolean testDir( final String file ) {
- try {
- final File f = new File( file );
- if ( !f.exists() ) {
+ if ( !entry3.getTaxonomyIdentifier().equals( "6326" ) ) {
+ System.out.println( entry3.getTaxonomyIdentifier() );
return false;
}
- if ( !f.isDirectory() ) {
+ if ( !entry3.getSequenceSymbol().equals( "RAF" ) ) {
+ System.out.println( entry3.getSequenceSymbol() );
return false;
}
- if ( !f.canRead() ) {
+ if ( !ForesterUtil.isEmpty( entry3.getGeneName() ) ) {
return false;
}
- }
- catch ( final Exception e ) {
- return false;
- }
- return true;
- }
-
- private static boolean testDomainId() {
- try {
- final DomainId id1 = new DomainId( "a" );
- final DomainId id2 = new DomainId( "a" );
- final DomainId id3 = new DomainId( "A" );
- final DomainId id4 = new DomainId( "b" );
- if ( !id1.equals( id1 ) ) {
+ if ( entry3.getCrossReferences().size() < 1 ) {
return false;
}
- if ( id1.getId().equals( "x" ) ) {
+ final SequenceDatabaseEntry entry4 = SequenceDbWsTools.obtainEntry( "AAA36557.1" );
+ if ( !entry4.getAccession().equals( "AAA36557" ) ) {
return false;
}
- if ( id1.getId().equals( null ) ) {
+ if ( !entry4.getTaxonomyScientificName().equals( "Homo sapiens" ) ) {
+ System.out.println( entry4.getTaxonomyScientificName() );
return false;
}
- if ( !id1.equals( id2 ) ) {
+ if ( !entry4.getSequenceName().equals( "Homo sapiens (human) ras protein" ) ) {
+ System.out.println( entry4.getSequenceName() );
return false;
}
- if ( id1.equals( id3 ) ) {
+ if ( !entry4.getTaxonomyIdentifier().equals( "9606" ) ) {
+ System.out.println( entry4.getTaxonomyIdentifier() );
return false;
}
- if ( id1.hashCode() != id1.hashCode() ) {
+ if ( !entry4.getGeneName().equals( "ras" ) ) {
+ System.out.println( entry4.getGeneName() );
return false;
}
- if ( id1.hashCode() != id2.hashCode() ) {
+ final SequenceDatabaseEntry entry5 = SequenceDbWsTools.obtainEntry( "AAZ45343.1" );
+ if ( !entry5.getAccession().equals( "AAZ45343" ) ) {
return false;
}
- if ( id1.hashCode() == id3.hashCode() ) {
+ if ( !entry5.getTaxonomyScientificName().equals( "Dechloromonas aromatica RCB" ) ) {
+ System.out.println( entry5.getTaxonomyScientificName() );
return false;
}
- if ( id1.compareTo( id1 ) != 0 ) {
+ if ( !entry5.getSequenceName().equals( "Dechloromonas aromatica RCB 1,4-alpha-glucan branching enzyme" ) ) {
+ System.out.println( entry5.getSequenceName() );
return false;
}
- if ( id1.compareTo( id2 ) != 0 ) {
+ if ( !entry5.getTaxonomyIdentifier().equals( "159087" ) ) {
+ System.out.println( entry5.getTaxonomyIdentifier() );
return false;
}
- if ( id1.compareTo( id3 ) != 0 ) {
+ final SequenceDatabaseEntry entry6 = SequenceDbWsTools.obtainEntry( "M30539" );
+ if ( !entry6.getAccession().equals( "M30539" ) ) {
return false;
}
- if ( id1.compareTo( id4 ) >= 0 ) {
+ if ( !entry6.getGeneName().equals( "ras" ) ) {
return false;
}
- if ( id4.compareTo( id1 ) <= 0 ) {
+ if ( !entry6.getSequenceName().equals( "Human SK2 c-Ha-ras-1 oncogene-encoded protein gene, exon 1" ) ) {
return false;
}
- if ( !id4.getId().equals( "b" ) ) {
+ if ( !entry6.getTaxonomyIdentifier().equals( "9606" ) ) {
return false;
}
- final DomainId id5 = new DomainId( " C " );
- if ( !id5.getId().equals( "C" ) ) {
+ if ( !entry6.getTaxonomyScientificName().equals( "Homo sapiens" ) ) {
return false;
}
- if ( id5.equals( id1 ) ) {
+ if ( entry6.getCrossReferences().size() < 1 ) {
return false;
}
}
- catch ( final Exception e ) {
+ catch ( final IOException e ) {
+ System.out.println();
+ System.out.println( "the following might be due to absence internet connection:" );
e.printStackTrace( System.out );
- return false;
- }
- return true;
- }
-
- private static boolean testEmblEntryRetrieval() {
- //The format for GenBank Accession numbers are:
- //Nucleotide: 1 letter + 5 numerals OR 2 letters + 6 numerals
- //Protein: 3 letters + 5 numerals
- //http://www.ncbi.nlm.nih.gov/Sequin/acc.html
- if ( !SequenceIdParser.parseGenbankAccessor( "AY423861" ).equals( "AY423861" ) ) {
- return false;
- }
- if ( !SequenceIdParser.parseGenbankAccessor( ".AY423861.2" ).equals( "AY423861.2" ) ) {
- return false;
- }
- if ( !SequenceIdParser.parseGenbankAccessor( "345_.AY423861.24_345" ).equals( "AY423861.24" ) ) {
- return false;
- }
- if ( SequenceIdParser.parseGenbankAccessor( "AAY423861" ) != null ) {
- return false;
- }
- if ( SequenceIdParser.parseGenbankAccessor( "AY4238612" ) != null ) {
- return false;
- }
- if ( SequenceIdParser.parseGenbankAccessor( "AAY4238612" ) != null ) {
- return false;
- }
- if ( SequenceIdParser.parseGenbankAccessor( "Y423861" ) != null ) {
- return false;
- }
- if ( !SequenceIdParser.parseGenbankAccessor( "S12345" ).equals( "S12345" ) ) {
- return false;
- }
- if ( !SequenceIdParser.parseGenbankAccessor( "|S12345|" ).equals( "S12345" ) ) {
- return false;
- }
- if ( SequenceIdParser.parseGenbankAccessor( "|S123456" ) != null ) {
- return false;
- }
- if ( SequenceIdParser.parseGenbankAccessor( "ABC123456" ) != null ) {
- return false;
- }
- if ( !SequenceIdParser.parseGenbankAccessor( "ABC12345" ).equals( "ABC12345" ) ) {
- return false;
- }
- if ( !SequenceIdParser.parseGenbankAccessor( "&ABC12345&" ).equals( "ABC12345" ) ) {
- return false;
+ return true;
}
- if ( SequenceIdParser.parseGenbankAccessor( "ABCD12345" ) != null ) {
+ catch ( final Exception e ) {
+ e.printStackTrace();
return false;
}
return true;
if ( !iter.next().getName().equals( "D" ) ) {
return false;
}
- if ( !iter.next().getName().equals( "E" ) ) {
+ if ( !iter.next().getName().equals( "E" ) ) {
+ return false;
+ }
+ if ( !iter.next().getName().equals( "F" ) ) {
+ return false;
+ }
+ if ( iter.hasNext() ) {
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace( System.out );
+ return false;
+ }
+ return true;
+ }
+
+ private static boolean testExtractSNFromNodeName() {
+ try {
+ if ( !ParserUtils.extractScientificNameFromNodeName( "BCDO2_Mus_musculus" ).equals( "Mus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "BCDO2 Mus musculus" ).equals( "Mus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_BCDO2" ).equals( "Mus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Mus musculus musculus BCDO2" )
+ .equals( "Mus musculus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_musculus_BCDO2" )
+ .equals( "Mus musculus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "BCDO2 Mus musculus musculus" )
+ .equals( "Mus musculus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Bcl Mus musculus musculus" )
+ .equals( "Mus musculus musculus" ) ) {
+ return false;
+ }
+ if ( ParserUtils.extractScientificNameFromNodeName( "vcl Mus musculus musculus" ) != null ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "could_be_anything_Mus_musculus_musculus_BCDO2" )
+ .equals( "Mus musculus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "could_be_anything_Mus_musculus_musculus_Musculus" )
+ .equals( "Mus musculus musculus" ) ) {
+ return false;
+ }
+ if ( ParserUtils.extractScientificNameFromNodeName( "could_be_anything_Mus_musculus_musculus_musculus" ) != null ) {
+ return false;
+ }
+ if ( ParserUtils.extractScientificNameFromNodeName( "musculus" ) != null ) {
+ return false;
+ }
+ if ( ParserUtils.extractScientificNameFromNodeName( "mus_musculus" ) != null ) {
+ return false;
+ }
+ if ( ParserUtils.extractScientificNameFromNodeName( "mus_musculus_musculus" ) != null ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_musculus_1" )
+ .equals( "Mus musculus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_1" ).equals( "Mus musculus" ) ) {
+ return false;
+ }
+ if ( ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_bcl" ) != null ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_BCL" ).equals( "Mus musculus" ) ) {
+ return false;
+ }
+ if ( ParserUtils.extractScientificNameFromNodeName( "Mus musculus bcl" ) != null ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Mus musculus BCL" ).equals( "Mus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Mus musculus xBCL" ).equals( "Mus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Mus musculus x1" ).equals( "Mus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( " -XS12_Mus_musculus_12" ).equals( "Mus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( " -1234_Mus_musculus_12 affrre e" )
+ .equals( "Mus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( " -1234_Mus_musculus_12_affrre_e" )
+ .equals( "Mus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus" ).equals( "Mus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_musculus_2bcl2" )
+ .equals( "Mus musculus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_musculus_2bcl2" )
+ .equals( "Mus musculus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_musculus_bcl2" )
+ .equals( "Mus musculus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Mus_musculus_123" ).equals( "Mus musculus" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Pilostyles mexicana Mexico Breedlove 27233" )
+ .equals( "Pilostyles mexicana" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia_coli_strain_K12/DH10B" )
+ .equals( "Escherichia coli strain K12/DH10B" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia_coli_str_K12/DH10B" )
+ .equals( "Escherichia coli str. K12/DH10B" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli str. K12/DH10B" )
+ .equals( "Escherichia coli str. K12/DH10B" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Arabidopsis_lyrata_subsp_lyrata" )
+ .equals( "Arabidopsis lyrata subsp. lyrata" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Arabidopsis lyrata subsp. lyrata" )
+ .equals( "Arabidopsis lyrata subsp. lyrata" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Arabidopsis lyrata subsp. lyrata 395" )
+ .equals( "Arabidopsis lyrata subsp. lyrata" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Arabidopsis lyrata subsp. lyrata bcl2" )
+ .equals( "Arabidopsis lyrata subsp. lyrata" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Arabidopsis lyrata subsp lyrata bcl2" )
+ .equals( "Arabidopsis lyrata subsp. lyrata" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Arabidopsis lyrata subspecies lyrata bcl2" )
+ .equals( "Arabidopsis lyrata subspecies lyrata" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Verbascum sinuatum var. adenosepalum bcl2" )
+ .equals( "Verbascum sinuatum var. adenosepalum" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli (strain K12)" )
+ .equals( "Escherichia coli (strain K12)" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli (strain K12) bcl2" )
+ .equals( "Escherichia coli (strain K12)" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli (str. K12)" )
+ .equals( "Escherichia coli (str. K12)" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli (str K12)" )
+ .equals( "Escherichia coli (str. K12)" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli (str. K12) bcl2" )
+ .equals( "Escherichia coli (str. K12)" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli (var K12) bcl2" )
+ .equals( "Escherichia coli (var. K12)" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli str. K-12 substr. MG1655star" )
+ .equals( "Escherichia coli str. K-12 substr. MG1655star" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli str K-12 substr MG1655star" )
+ .equals( "Escherichia coli str. K-12 substr. MG1655star" ) ) {
+ return false;
+ }
+ if ( !ParserUtils
+ .extractScientificNameFromNodeName( "could be anything Escherichia coli str K-12 substr MG1655star" )
+ .equals( "Escherichia coli str. K-12 substr. MG1655star" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia coli str K-12 substr MG1655star gene1" )
+ .equals( "Escherichia coli str. K-12 substr. MG1655star" ) ) {
+ return false;
+ }
+ if ( !ParserUtils
+ .extractScientificNameFromNodeName( "could be anything Escherichia coli str K-12 substr MG1655star GENE1" )
+ .equals( "Escherichia coli str. K-12 substr. MG1655star" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia_coli_str_K-12_substr_MG1655star" )
+ .equals( "Escherichia coli str. K-12 substr. MG1655star" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Escherichia_coli_str_K-12_substr_MG1655star" )
+ .equals( "Escherichia coli str. K-12 substr. MG1655star" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Macrocera sp." ).equals( "Macrocera sp." ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Macrocera sp. 123" ).equals( "Macrocera sp." ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Macrocera sp. K12" ).equals( "Macrocera sp." ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "something Macrocera sp. K12" )
+ .equals( "Macrocera sp." ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Macrocera sp" ).equals( "Macrocera sp." ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Sesamum rigidum ssp merenskyanum 07 48" )
+ .equals( "Sesamum rigidum subsp. merenskyanum" ) ) {
+ return false;
+ }
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Sesamum rigidum ssp. merenskyanum" )
+ .equals( "Sesamum rigidum subsp. merenskyanum" ) ) {
return false;
}
- if ( !iter.next().getName().equals( "F" ) ) {
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Sesamum rigidum (ssp. merenskyanum)" )
+ .equals( "Sesamum rigidum (subsp. merenskyanum)" ) ) {
return false;
}
- if ( iter.hasNext() ) {
+ if ( !ParserUtils.extractScientificNameFromNodeName( "Sesamum rigidum (ssp merenskyanum)" )
+ .equals( "Sesamum rigidum (subsp. merenskyanum)" ) ) {
return false;
}
}
return true;
}
- private static boolean testExtractSNFromNodeName() {
+ private static boolean testExtractTaxonomyDataFromNodeName() {
try {
- if ( !ParserUtils.extractScientificNameFromNodeName( "BCDO2_Mus_musculus" ).equals( "Mus musculus" ) ) {
+ PhylogenyNode n = new PhylogenyNode( "tr|B1AM49|B1AM49_HUMAN" );
+ if ( !ParserUtils.extractTaxonomyDataFromNodeName( n, TAXONOMY_EXTRACTION.AGGRESSIVE ).equals( "HUMAN" ) ) {
return false;
}
- if ( !ParserUtils.extractScientificNameFromNodeName( "BCDO2_Mus_musculus_musculus" )
- .equals( "Mus musculus musculus" ) ) {
+ n = new PhylogenyNode( "tr|B1AM49|B1AM49_HUMAN~1-2" );
+ if ( !ParserUtils.extractTaxonomyDataFromNodeName( n, TAXONOMY_EXTRACTION.AGGRESSIVE ).equals( "HUMAN" ) ) {
return false;
}
- if ( !ParserUtils.extractScientificNameFromNodeName( "BCDO2_Mus_musculus_musculus-12" )
- .equals( "Mus musculus musculus" ) ) {
+ n = new PhylogenyNode( "tr|B1AM49|HNRPR_HUMAN" );
+ if ( !ParserUtils.extractTaxonomyDataFromNodeName( n, TAXONOMY_EXTRACTION.AGGRESSIVE ).equals( "HUMAN" ) ) {
return false;
}
- if ( !ParserUtils.extractScientificNameFromNodeName( " -XS12_Mus_musculus-12" ).equals( "Mus musculus" ) ) {
+ n = new PhylogenyNode( "tr|B1AM49|HNRPR_HUMAN|" );
+ if ( !ParserUtils.extractTaxonomyDataFromNodeName( n, TAXONOMY_EXTRACTION.AGGRESSIVE ).equals( "HUMAN" ) ) {
return false;
}
- if ( !ParserUtils.extractScientificNameFromNodeName( " -1234_Mus_musculus-12 affrre e" )
- .equals( "Mus musculus" ) ) {
+ n = new PhylogenyNode( "tr|B1AM49|HNRPR_HUMAN~12" );
+ if ( !ParserUtils.extractTaxonomyDataFromNodeName( n, TAXONOMY_EXTRACTION.AGGRESSIVE ).equals( "HUMAN" ) ) {
+ return false;
+ }
+ n = new PhylogenyNode( "HNRPR_HUMAN" );
+ if ( !ParserUtils.extractTaxonomyDataFromNodeName( n, TAXONOMY_EXTRACTION.AGGRESSIVE ).equals( "HUMAN" ) ) {
+ return false;
+ }
+ n = new PhylogenyNode( "HNRPR_HUMAN_X" );
+ if ( !ParserUtils.extractTaxonomyDataFromNodeName( n, TAXONOMY_EXTRACTION.AGGRESSIVE ).equals( "HUMAN" ) ) {
return false;
}
}
}
if ( !ParserUtils.extractTaxonomyCodeFromNodeName( "BCL2_MOUSE function = 23445",
TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED )
- .equals( "MOUSE" ) ) {
+ .equals( "MOUSE" ) ) {
return false;
}
if ( !ParserUtils.extractTaxonomyCodeFromNodeName( "BCL2_MOUSE+function = 23445",
TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED )
- .equals( "MOUSE" ) ) {
+ .equals( "MOUSE" ) ) {
return false;
}
if ( !ParserUtils.extractTaxonomyCodeFromNodeName( "BCL2_MOUSE|function = 23445",
TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED )
- .equals( "MOUSE" ) ) {
+ .equals( "MOUSE" ) ) {
return false;
}
if ( ParserUtils.extractTaxonomyCodeFromNodeName( "BCL2_MOUSEfunction = 23445",
try {
PhylogenyNode n = new PhylogenyNode();
n.setName( "tr|B3RJ64" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n.setName( "tr.B3RJ64" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n.setName( "tr=B3RJ64" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n.setName( "tr-B3RJ64" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n.setName( "tr/B3RJ64" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n.setName( "tr\\B3RJ64" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n.setName( "tr_B3RJ64" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n.setName( " tr|B3RJ64 " );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n.setName( "-tr|B3RJ64-" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n.setName( "-tr=B3RJ64-" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n.setName( "_tr=B3RJ64_" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n.setName( " tr_tr|B3RJ64_sp|123 " );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
- n.setName( "sp|B3RJ64" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ n.setName( "B3RJ64" );
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
- n.setName( "ssp|B3RJ64" );
- if ( ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ) != null ) {
+ n.setName( "sp|B3RJ64" );
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n.setName( "sp|B3RJ64C" );
- if ( ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ) != null ) {
+ if ( SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ) != null ) {
return false;
}
n.setName( "sp B3RJ64" );
- if ( ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ) != null ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n.setName( "sp|B3RJ6X" );
- if ( ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ) != null ) {
+ if ( SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ) != null ) {
return false;
}
n.setName( "sp|B3RJ6" );
- if ( ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ) != null ) {
+ if ( SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ) != null ) {
return false;
}
n.setName( "K1PYK7_CRAGI" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "K1PYK7_CRAGI" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "K1PYK7_CRAGI" ) ) {
return false;
}
n.setName( "K1PYK7_PEA" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "K1PYK7_PEA" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "K1PYK7_PEA" ) ) {
return false;
}
n.setName( "K1PYK7_RAT" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "K1PYK7_RAT" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "K1PYK7_RAT" ) ) {
return false;
}
n.setName( "K1PYK7_PIG" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "K1PYK7_PIG" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "K1PYK7_PIG" ) ) {
return false;
}
n.setName( "~K1PYK7_PIG~" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "K1PYK7_PIG" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "K1PYK7_PIG" ) ) {
return false;
}
n.setName( "123456_ECOLI-K1PYK7_CRAGI-sp" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "K1PYK7_CRAGI" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "K1PYK7_CRAGI" ) ) {
return false;
}
n.setName( "K1PYKX_CRAGI" );
- if ( ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ) != null ) {
+ if ( SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ) != null ) {
return false;
}
n.setName( "XXXXX_CRAGI" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "XXXXX_CRAGI" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "XXXXX_CRAGI" ) ) {
return false;
}
n.setName( "tr|H3IB65|H3IB65_STRPU~2-2" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "H3IB65" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "H3IB65" ) ) {
return false;
}
n.setName( "jgi|Lacbi2|181470|Lacbi1.estExt_GeneWisePlus_human.C_10729~2-3" );
- if ( ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ) != null ) {
+ if ( SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ) != null ) {
return false;
}
n.setName( "sp|Q86U06|RBM23_HUMAN~2-2" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "Q86U06" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "Q86U06" ) ) {
return false;
}
n = new PhylogenyNode();
org.forester.phylogeny.data.Sequence seq = new org.forester.phylogeny.data.Sequence();
seq.setSymbol( "K1PYK7_CRAGI" );
n.getNodeData().addSequence( seq );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "K1PYK7_CRAGI" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "K1PYK7_CRAGI" ) ) {
return false;
}
seq.setSymbol( "tr|B3RJ64" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n = new PhylogenyNode();
seq = new org.forester.phylogeny.data.Sequence();
seq.setName( "K1PYK7_CRAGI" );
n.getNodeData().addSequence( seq );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "K1PYK7_CRAGI" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "K1PYK7_CRAGI" ) ) {
return false;
}
seq.setName( "tr|B3RJ64" );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
n = new PhylogenyNode();
seq = new org.forester.phylogeny.data.Sequence();
seq.setAccession( new Accession( "K1PYK8_CRAGI", "?" ) );
n.getNodeData().addSequence( seq );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "K1PYK8_CRAGI" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "K1PYK8_CRAGI" ) ) {
return false;
}
n = new PhylogenyNode();
seq = new org.forester.phylogeny.data.Sequence();
seq.setAccession( new Accession( "tr|B3RJ64", "?" ) );
n.getNodeData().addSequence( seq );
- if ( !ForesterUtil.extractUniProtKbProteinSeqIdentifier( n ).equals( "B3RJ64" ) ) {
+ if ( !SequenceAccessionTools.obtainUniProtAccessorFromDataFields( n ).equals( "B3RJ64" ) ) {
return false;
}
//
n = new PhylogenyNode();
n.setName( "ACP19736" );
- if ( !ForesterUtil.extractGenbankAccessor( n ).equals( "ACP19736" ) ) {
+ if ( !SequenceAccessionTools.obtainGenbankAccessorFromDataFields( n ).equals( "ACP19736" ) ) {
return false;
}
n = new PhylogenyNode();
- n.setName( "_ACP19736_" );
- if ( !ForesterUtil.extractGenbankAccessor( n ).equals( "ACP19736" ) ) {
+ n.setName( "|ACP19736|" );
+ if ( !SequenceAccessionTools.obtainGenbankAccessorFromDataFields( n ).equals( "ACP19736" ) ) {
return false;
}
}
if ( !msa_0.getSequenceAsString( 1 ).toString().equalsIgnoreCase( "DKXASDFXSFXFKFKSXDFKSLX" ) ) {
return false;
}
- if ( !msa_0.getSequenceAsString( 2 ).toString().equalsIgnoreCase( "SXDFKSXLFSFPWEXPRXWXERR" ) ) {
+ if ( !msa_0.getSequenceAsString( 2 ).toString().equalsIgnoreCase( "SXDFKSXLFSFPWEXPROWXERR" ) ) {
return false;
}
if ( !msa_0.getSequenceAsString( 3 ).toString().equalsIgnoreCase( "AAAAAAAAAAAAAAAAAAAAAAA" ) ) {
return true;
}
+ private static boolean testGenbankAccessorParsing() {
+ //The format for GenBank Accession numbers are:
+ //Nucleotide: 1 letter + 5 numerals OR 2 letters + 6 numerals
+ //Protein: 3 letters + 5 numerals
+ //http://www.ncbi.nlm.nih.gov/Sequin/acc.html
+ if ( !SequenceAccessionTools.parseGenbankAccessorFromString( "AY423861" ).equals( "AY423861" ) ) {
+ return false;
+ }
+ if ( !SequenceAccessionTools.parseGenbankAccessorFromString( ".AY423861.2" ).equals( "AY423861.2" ) ) {
+ return false;
+ }
+ if ( !SequenceAccessionTools.parseGenbankAccessorFromString( "345_.AY423861.24_345" ).equals( "AY423861.24" ) ) {
+ return false;
+ }
+ if ( SequenceAccessionTools.parseGenbankAccessorFromString( "AAY423861" ) != null ) {
+ return false;
+ }
+ if ( SequenceAccessionTools.parseGenbankAccessorFromString( "AY4238612" ) != null ) {
+ return false;
+ }
+ if ( SequenceAccessionTools.parseGenbankAccessorFromString( "AAY4238612" ) != null ) {
+ return false;
+ }
+ if ( SequenceAccessionTools.parseGenbankAccessorFromString( "Y423861" ) != null ) {
+ return false;
+ }
+ if ( !SequenceAccessionTools.parseGenbankAccessorFromString( "S12345" ).equals( "S12345" ) ) {
+ return false;
+ }
+ if ( !SequenceAccessionTools.parseGenbankAccessorFromString( "|S12345|" ).equals( "S12345" ) ) {
+ return false;
+ }
+ if ( SequenceAccessionTools.parseGenbankAccessorFromString( "|S123456" ) != null ) {
+ return false;
+ }
+ if ( SequenceAccessionTools.parseGenbankAccessorFromString( "ABC123456" ) != null ) {
+ return false;
+ }
+ if ( !SequenceAccessionTools.parseGenbankAccessorFromString( "ABC12345" ).equals( "ABC12345" ) ) {
+ return false;
+ }
+ if ( !SequenceAccessionTools.parseGenbankAccessorFromString( "&ABC12345&" ).equals( "ABC12345" ) ) {
+ return false;
+ }
+ if ( SequenceAccessionTools.parseGenbankAccessorFromString( "ABCD12345" ) != null ) {
+ return false;
+ }
+ return true;
+ }
+
private static boolean testGeneralMsaParser() {
try {
final String msa_str_0 = "seq1 abcd\n\nseq2 efgh\n";
private static boolean testGetLCA2() {
try {
final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance();
- final Phylogeny p_a = factory.create( "(a)", new NHXParser() )[ 0 ];
+ // final Phylogeny p_a = factory.create( "(a)", new NHXParser() )[ 0 ];
+ final Phylogeny p_a = NHXParser.parse( "(a)" )[ 0 ];
PhylogenyMethods.preOrderReId( p_a );
final PhylogenyNode p_a_1 = PhylogenyMethods.calculateLCAonTreeWithIdsInPreOrder( p_a.getNode( "a" ),
p_a.getNode( "a" ) );
if ( !p_a_1.getName().equals( "a" ) ) {
return false;
}
- final Phylogeny p_b = factory.create( "((a)b)", new NHXParser() )[ 0 ];
+ final Phylogeny p_b = NHXParser.parse( "((a)b)" )[ 0 ];
PhylogenyMethods.preOrderReId( p_b );
final PhylogenyNode p_b_1 = PhylogenyMethods.calculateLCAonTreeWithIdsInPreOrder( p_b.getNode( "b" ),
p_b.getNode( "a" ) );
final String test_dir = Test.PATH_TO_TEST_DATA;
try {
final HmmscanPerDomainTableParser parser1 = new HmmscanPerDomainTableParser( new File( test_dir
- + ForesterUtil.getFileSeparator() + "hmmscan30b3_output_1" ), "MONBR", INDIVIDUAL_SCORE_CUTOFF.NONE );
+ + ForesterUtil.getFileSeparator() + "hmmscan30b3_output_1" ), "MONBR", INDIVIDUAL_SCORE_CUTOFF.NONE );
parser1.parse();
final HmmscanPerDomainTableParser parser2 = new HmmscanPerDomainTableParser( new File( test_dir
- + ForesterUtil.getFileSeparator() + "hmmscan30b3_output_2" ), "MONBR", INDIVIDUAL_SCORE_CUTOFF.NONE );
+ + ForesterUtil.getFileSeparator() + "hmmscan30b3_output_2" ), "MONBR", INDIVIDUAL_SCORE_CUTOFF.NONE );
final List<Protein> proteins = parser2.parse();
if ( parser2.getProteinsEncountered() != 4 ) {
return false;
if ( parser2.getDomainsIgnoredDueToDuf() != 0 ) {
return false;
}
- if ( parser2.getDomainsIgnoredDueToEval() != 0 ) {
+ if ( parser2.getDomainsIgnoredDueToFsEval() != 0 ) {
+ return false;
+ }
+ if ( parser2.getDomainsIgnoredDueToIEval() != 0 ) {
return false;
}
final Protein p1 = proteins.get( 0 );
if ( !Test.isEqual( p4.getProteinDomain( 0 ).getPerDomainScore(), 135.7 ) ) {
return false;
}
- if ( !Test.isEqual( p4.getProteinDomain( 0 ).getPerSequenceEvalue(), 8.3e-40 ) ) {
- return false;
- }
- if ( !Test.isEqual( p4.getProteinDomain( 0 ).getPerSequenceScore(), 136.3 ) ) {
- return false;
- }
if ( !Test.isEqual( p4.getProteinDomain( 0 ).getNumber(), 1 ) ) {
return false;
}
private static boolean testMsaQualityMethod() {
try {
- final Sequence s0 = BasicSequence.createAaSequence( "a", "ABAXEFGHIJ" );
- final Sequence s1 = BasicSequence.createAaSequence( "b", "ABBXEFGHIJ" );
- final Sequence s2 = BasicSequence.createAaSequence( "c", "AXCXEFGHIJ" );
- final Sequence s3 = BasicSequence.createAaSequence( "d", "AXDDEFGHIJ" );
- final List<Sequence> l = new ArrayList<Sequence>();
+ final MolecularSequence s0 = BasicSequence.createAaSequence( "a", "ABAXEFGHIJJE-" );
+ final MolecularSequence s1 = BasicSequence.createAaSequence( "b", "ABBXEFGHIJJBB" );
+ final MolecularSequence s2 = BasicSequence.createAaSequence( "c", "AXCXEFGHIJJ--" );
+ final MolecularSequence s3 = BasicSequence.createAaSequence( "d", "AXDDEFGHIJ---" );
+ final List<MolecularSequence> l = new ArrayList<MolecularSequence>();
l.add( s0 );
l.add( s1 );
l.add( s2 );
if ( !isEqual( 0.75, MsaMethods.calculateIdentityRatio( msa, 3 ) ) ) {
return false;
}
+ if ( !isEqual( 0.75, MsaMethods.calculateIdentityRatio( msa, 10 ) ) ) {
+ return false;
+ }
+ if ( !isEqual( 0.25, MsaMethods.calculateIdentityRatio( msa, 11 ) ) ) {
+ return false;
+ }
+ if ( !isEqual( 0.25, MsaMethods.calculateIdentityRatio( msa, 12 ) ) ) {
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace( System.out );
+ return false;
+ }
+ return true;
+ }
+
+ private static boolean testMsaEntropy() {
+ try {
+ final MolecularSequence s0 = BasicSequence.createAaSequence( "a", "AAAAAAA" );
+ final MolecularSequence s1 = BasicSequence.createAaSequence( "b", "AAAIACC" );
+ final MolecularSequence s2 = BasicSequence.createAaSequence( "c", "AAIIIIF" );
+ final MolecularSequence s3 = BasicSequence.createAaSequence( "d", "AIIIVVW" );
+ final List<MolecularSequence> l = new ArrayList<MolecularSequence>();
+ l.add( s0 );
+ l.add( s1 );
+ l.add( s2 );
+ l.add( s3 );
+ final Msa msa = BasicMsa.createInstance( l );
+ //TODO need to DO the tests!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
+ //FIXME
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa, 0 ) );
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa, 1 ) );
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa, 2 ) );
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa, 3 ) );
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa, 4 ) );
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa, 5 ) );
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa, 6 ) );
+ // System.out.println();
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 6, msa, 0 ) );
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 6, msa, 1 ) );
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 6, msa, 2 ) );
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 6, msa, 3 ) );
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 6, msa, 4 ) );
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 6, msa, 5 ) );
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 6, msa, 6 ) );
+ final List<MolecularSequence> l2 = new ArrayList<MolecularSequence>();
+ l2.add( BasicSequence.createAaSequence( "1", "AAAAAAA" ) );
+ l2.add( BasicSequence.createAaSequence( "2", "AAAIACC" ) );
+ l2.add( BasicSequence.createAaSequence( "3", "AAIIIIF" ) );
+ l2.add( BasicSequence.createAaSequence( "4", "AIIIVVW" ) );
+ l2.add( BasicSequence.createAaSequence( "5", "AAAAAAA" ) );
+ l2.add( BasicSequence.createAaSequence( "6", "AAAIACC" ) );
+ l2.add( BasicSequence.createAaSequence( "7", "AAIIIIF" ) );
+ l2.add( BasicSequence.createAaSequence( "8", "AIIIVVW" ) );
+ l2.add( BasicSequence.createAaSequence( "9", "AAAAAAA" ) );
+ l2.add( BasicSequence.createAaSequence( "10", "AAAIACC" ) );
+ l2.add( BasicSequence.createAaSequence( "11", "AAIIIIF" ) );
+ l2.add( BasicSequence.createAaSequence( "12", "AIIIVVW" ) );
+ l2.add( BasicSequence.createAaSequence( "13", "AAIIIIF" ) );
+ l2.add( BasicSequence.createAaSequence( "14", "AIIIVVW" ) );
+ l2.add( BasicSequence.createAaSequence( "15", "AAAAAAA" ) );
+ l2.add( BasicSequence.createAaSequence( "16", "AAAIACC" ) );
+ l2.add( BasicSequence.createAaSequence( "17", "AAIIIIF" ) );
+ l2.add( BasicSequence.createAaSequence( "18", "AIIIVVW" ) );
+ l2.add( BasicSequence.createAaSequence( "19", "AAAAAAA" ) );
+ l2.add( BasicSequence.createAaSequence( "20", "AAAIACC" ) );
+ l2.add( BasicSequence.createAaSequence( "21", "AAIIIIF" ) );
+ l2.add( BasicSequence.createAaSequence( "22", "AIIIVVW" ) );
+ final Msa msa2 = BasicMsa.createInstance( l2 );
+ // System.out.println();
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa2, 0 ) );
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa2, 1 ) );
+ // System.out.println( MsaMethods.calcNormalizedShannonsEntropy( 20, msa2, 2 ) );
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace( System.out );
+ return false;
+ }
+ return true;
+ }
+
+ private static boolean testDeleteableMsa() {
+ try {
+ final MolecularSequence s0 = BasicSequence.createAaSequence( "a", "AAAA" );
+ final MolecularSequence s1 = BasicSequence.createAaSequence( "b", "BAAA" );
+ final MolecularSequence s2 = BasicSequence.createAaSequence( "c", "CAAA" );
+ final MolecularSequence s3 = BasicSequence.createAaSequence( "d", "DAAA" );
+ final MolecularSequence s4 = BasicSequence.createAaSequence( "e", "EAAA" );
+ final MolecularSequence s5 = BasicSequence.createAaSequence( "f", "FAAA" );
+ final List<MolecularSequence> l0 = new ArrayList<MolecularSequence>();
+ l0.add( s0 );
+ l0.add( s1 );
+ l0.add( s2 );
+ l0.add( s3 );
+ l0.add( s4 );
+ l0.add( s5 );
+ final DeleteableMsa dmsa0 = DeleteableMsa.createInstance( l0 );
+ dmsa0.deleteRow( "b", false );
+ if ( !dmsa0.getIdentifier( 1 ).equals( "c" ) ) {
+ return false;
+ }
+ dmsa0.deleteRow( "e", false );
+ dmsa0.deleteRow( "a", false );
+ dmsa0.deleteRow( "f", false );
+ if ( dmsa0.getLength() != 4 ) {
+ return false;
+ }
+ if ( dmsa0.getNumberOfSequences() != 2 ) {
+ return false;
+ }
+ if ( !dmsa0.getIdentifier( 0 ).equals( "c" ) ) {
+ return false;
+ }
+ if ( !dmsa0.getIdentifier( 1 ).equals( "d" ) ) {
+ return false;
+ }
+ if ( dmsa0.getResidueAt( 0, 0 ) != 'C' ) {
+ return false;
+ }
+ if ( !dmsa0.getSequenceAsString( 0 ).toString().equals( "CAAA" ) ) {
+ return false;
+ }
+ if ( dmsa0.getColumnAt( 0 ).size() != 2 ) {
+ return false;
+ }
+ dmsa0.deleteRow( "c", false );
+ dmsa0.deleteRow( "d", false );
+ if ( dmsa0.getNumberOfSequences() != 0 ) {
+ return false;
+ }
+ //
+ final MolecularSequence s_0 = BasicSequence.createAaSequence( "a", "--A---B-C--X----" );
+ final MolecularSequence s_1 = BasicSequence.createAaSequence( "b", "--B-----C-------" );
+ final MolecularSequence s_2 = BasicSequence.createAaSequence( "c", "--C--AB-C------Z" );
+ final MolecularSequence s_3 = BasicSequence.createAaSequence( "d", "--D--AA-C-------" );
+ final MolecularSequence s_4 = BasicSequence.createAaSequence( "e", "--E--AA-C-------" );
+ final MolecularSequence s_5 = BasicSequence.createAaSequence( "f", "--F--AB-CD--Y---" );
+ final List<MolecularSequence> l1 = new ArrayList<MolecularSequence>();
+ l1.add( s_0 );
+ l1.add( s_1 );
+ l1.add( s_2 );
+ l1.add( s_3 );
+ l1.add( s_4 );
+ l1.add( s_5 );
+ final DeleteableMsa dmsa1 = DeleteableMsa.createInstance( l1 );
+ dmsa1.deleteGapOnlyColumns();
+ dmsa1.deleteRow( "a", false );
+ dmsa1.deleteRow( "f", false );
+ dmsa1.deleteRow( "d", false );
+ dmsa1.deleteGapOnlyColumns();
+ if ( !dmsa1.getSequenceAsString( 0 ).toString().equals( "B--C-" ) ) {
+ return false;
+ }
+ if ( !dmsa1.getSequenceAsString( 1 ).toString().equals( "CABCZ" ) ) {
+ return false;
+ }
+ if ( !dmsa1.getSequenceAsString( 2 ).toString().equals( "EAAC-" ) ) {
+ return false;
+ }
+ dmsa1.deleteRow( "c", false );
+ dmsa1.deleteGapOnlyColumns();
+ final Writer w0 = new StringWriter();
+ dmsa1.write( w0, MSA_FORMAT.FASTA );
+ final Writer w1 = new StringWriter();
+ dmsa1.write( w1, MSA_FORMAT.PHYLIP );
+ if ( !dmsa1.getSequenceAsString( 0 ).toString().equals( "B--C" ) ) {
+ return false;
+ }
+ if ( !dmsa1.getSequenceAsString( 1 ).toString().equals( "EAAC" ) ) {
+ return false;
+ }
+ final MolecularSequence s__0 = BasicSequence.createAaSequence( "a", "A------" );
+ final MolecularSequence s__1 = BasicSequence.createAaSequence( "b", "BB-----" );
+ final MolecularSequence s__2 = BasicSequence.createAaSequence( "c", "CCC----" );
+ final MolecularSequence s__3 = BasicSequence.createAaSequence( "d", "DDDD---" );
+ final MolecularSequence s__4 = BasicSequence.createAaSequence( "e", "EEEEE--" );
+ final MolecularSequence s__5 = BasicSequence.createAaSequence( "f", "FFFFFF-" );
+ final List<MolecularSequence> l2 = new ArrayList<MolecularSequence>();
+ l2.add( s__0 );
+ l2.add( s__1 );
+ l2.add( s__2 );
+ l2.add( s__3 );
+ l2.add( s__4 );
+ l2.add( s__5 );
+ final DeleteableMsa dmsa2 = DeleteableMsa.createInstance( l2 );
+ dmsa2.deleteGapColumns( 0.5 );
+ if ( !dmsa2.getSequenceAsString( 0 ).toString().equals( "A---" ) ) {
+ return false;
+ }
+ if ( !dmsa2.getSequenceAsString( 1 ).toString().equals( "BB--" ) ) {
+ return false;
+ }
+ if ( !dmsa2.getSequenceAsString( 2 ).toString().equals( "CCC-" ) ) {
+ return false;
+ }
+ dmsa2.deleteGapColumns( 0.2 );
+ if ( !dmsa2.getSequenceAsString( 0 ).toString().equals( "A-" ) ) {
+ return false;
+ }
+ if ( !dmsa2.getSequenceAsString( 1 ).toString().equals( "BB" ) ) {
+ return false;
+ }
+ if ( !dmsa2.getSequenceAsString( 2 ).toString().equals( "CC" ) ) {
+ return false;
+ }
+ dmsa2.deleteGapColumns( 0 );
+ dmsa2.deleteRow( "a", false );
+ dmsa2.deleteRow( "b", false );
+ dmsa2.deleteRow( "f", false );
+ dmsa2.deleteRow( "e", false );
+ dmsa2.setIdentifier( 0, "new_c" );
+ dmsa2.setIdentifier( 1, "new_d" );
+ dmsa2.setResidueAt( 0, 0, 'x' );
+ final MolecularSequence s = dmsa2.deleteRow( "new_d", true );
+ if ( !s.getMolecularSequenceAsString().equals( "D" ) ) {
+ return false;
+ }
+ final Writer w = new StringWriter();
+ dmsa2.write( w, MSA_FORMAT.PHYLIP );
+ final String phylip = w.toString();
+ if ( !phylip.equals( "1 1" + ForesterUtil.LINE_SEPARATOR + "new_c x" + ForesterUtil.LINE_SEPARATOR ) ) {
+ System.out.println( phylip );
+ return false;
+ }
+ final Writer w2 = new StringWriter();
+ dmsa2.write( w2, MSA_FORMAT.FASTA );
+ final String fasta = w2.toString();
+ if ( !fasta.equals( ">new_c" + ForesterUtil.LINE_SEPARATOR + "x" + ForesterUtil.LINE_SEPARATOR ) ) {
+ System.out.println( fasta );
+ return false;
+ }
}
catch ( final Exception e ) {
e.printStackTrace( System.out );
if ( !ext.get( 4 ).getName().equals( "h" ) ) {
return false;
}
- //
- //
ext.clear();
final StringBuffer sb2 = new StringBuffer( "((a,b)ab,(((c,d)cd,e)cde,(f,(g,h)gh)fgh)cdefgh)abcdefgh" );
final Phylogeny t2 = factory.create( sb2, new NHXParser() )[ 0 ];
if ( !ext.get( 3 ).getName().equals( "gh" ) ) {
return false;
}
- //
- //
ext.clear();
final StringBuffer sb3 = new StringBuffer( "((a,b)ab,(((c,d)cd,e)cde,(f,(g,h)gh)fgh)cdefgh)abcdefgh" );
final Phylogeny t3 = factory.create( sb3, new NHXParser() )[ 0 ];
if ( !ext.get( 2 ).getName().equals( "fgh" ) ) {
return false;
}
- //
- //
ext.clear();
final StringBuffer sb4 = new StringBuffer( "((a,b)ab,(((c,d)cd,e)cde,(f,(g,h)gh)fgh)cdefgh)abcdefgh" );
final Phylogeny t4 = factory.create( sb4, new NHXParser() )[ 0 ];
if ( n.getNextExternalNodeWhileTakingIntoAccountCollapsedNodes() != null ) {
return false;
}
- //
- //
final StringBuffer sb5 = new StringBuffer( "((a,b)ab,(((c,d)cd,e)cde,(f,(g,h))fgh)cdefgh)abcdefgh" );
final Phylogeny t5 = factory.create( sb5, new NHXParser() )[ 0 ];
ext.clear();
if ( !ext.get( 7 ).getName().equals( "h" ) ) {
return false;
}
- //
- //
final StringBuffer sb6 = new StringBuffer( "((a,b)ab,(((c,d)cd,e)cde,(f,(g,h))fgh)cdefgh)abcdefgh" );
final Phylogeny t6 = factory.create( sb6, new NHXParser() )[ 0 ];
ext.clear();
if ( !ext.get( 6 ).getName().equals( "h" ) ) {
return false;
}
- //
- //
final StringBuffer sb7 = new StringBuffer( "((a,b)ab,(((c,d)cd,e)cde,(f,(g,h))fgh)cdefgh)abcdefgh" );
final Phylogeny t7 = factory.create( sb7, new NHXParser() )[ 0 ];
ext.clear();
if ( !ext.get( 6 ).getName().equals( "h" ) ) {
return false;
}
- //
- //
final StringBuffer sb8 = new StringBuffer( "((a,b)ab,(((c,d)cd,e)cde,(f,(g,h))fgh)cdefgh)abcdefgh" );
final Phylogeny t8 = factory.create( sb8, new NHXParser() )[ 0 ];
ext.clear();
if ( !ext.get( 6 ).getName().equals( "h" ) ) {
return false;
}
- //
- //
final StringBuffer sb9 = new StringBuffer( "((a,b)ab,(((c,d)cd,e)cde,(f,(g,h)gh)fgh)cdefgh)abcdefgh" );
final Phylogeny t9 = factory.create( sb9, new NHXParser() )[ 0 ];
ext.clear();
if ( !ext.get( 6 ).getName().equals( "gh" ) ) {
return false;
}
- //
- //
final StringBuffer sb10 = new StringBuffer( "((a,b)ab,(((c,d)cd,e)cde,(f,(g,h)gh)fgh)cdefgh)abcdefgh" );
final Phylogeny t10 = factory.create( sb10, new NHXParser() )[ 0 ];
ext.clear();
if ( !ext.get( 6 ).getName().equals( "gh" ) ) {
return false;
}
- //
- //
final StringBuffer sb11 = new StringBuffer( "((a,b)ab,(((c,d)cd,e)cde,(f,(g,h)gh)fgh)cdefgh)abcdefgh" );
final Phylogeny t11 = factory.create( sb11, new NHXParser() )[ 0 ];
ext.clear();
if ( !ext.get( 5 ).getName().equals( "fgh" ) ) {
return false;
}
- //
- //
final StringBuffer sb12 = new StringBuffer( "((a,b)ab,(((c,d)cd,e)cde,(f,(g,h)gh)fgh)cdefgh)abcdefgh" );
final Phylogeny t12 = factory.create( sb12, new NHXParser() )[ 0 ];
ext.clear();
if ( !ext.get( 5 ).getName().equals( "fgh" ) ) {
return false;
}
- //
- //
final StringBuffer sb13 = new StringBuffer( "((a,b)ab,(((c,d)cd,e)cde,(f,(g,h)gh)fgh)cdefgh)abcdefgh" );
final Phylogeny t13 = factory.create( sb13, new NHXParser() )[ 0 ];
ext.clear();
if ( !ext.get( 4 ).getName().equals( "fgh" ) ) {
return false;
}
- //
- //
final StringBuffer sb14 = new StringBuffer( "((a,b,0)ab,(((c,d)cd,e)cde,(f,(g,h,1,2)gh,0)fgh)cdefgh)abcdefgh" );
final Phylogeny t14 = factory.create( sb14, new NHXParser() )[ 0 ];
ext.clear();
if ( !ext.get( 4 ).getName().equals( "fgh" ) ) {
return false;
}
- //
- //
final StringBuffer sb15 = new StringBuffer( "((a,b,0)ab,(((c,d)cd,e)cde,x,(f,(g,h,1,2)gh,0)fgh)cdefgh)abcdefgh" );
final Phylogeny t15 = factory.create( sb15, new NHXParser() )[ 0 ];
ext.clear();
if ( phylogenies[ 17 ].getNumberOfExternalNodes() != 10 ) {
return false;
}
+ final NexusPhylogeniesParser p2 = new NexusPhylogeniesParser();
+ phylogenies = null;
+ phylogenies = factory.create( Test.PATH_TO_TEST_DATA + "S15613.nex", p2 );
+ if ( phylogenies.length != 9 ) {
+ return false;
+ }
+ if ( !isEqual( 0.48039661496919533, phylogenies[ 0 ].getNode( "Diadocidia_spinosula" )
+ .getDistanceToParent() ) ) {
+ return false;
+ }
+ if ( !isEqual( 0.3959796191512233, phylogenies[ 0 ].getNode( "Diadocidia_stanfordensis" )
+ .getDistanceToParent() ) ) {
+ return false;
+ }
+ if ( !phylogenies[ 0 ].getName().equals( "Family Diadocidiidae MLT (Imported_tree_0)" ) ) {
+ return false;
+ }
+ if ( !phylogenies[ 1 ].getName().equals( "Family Diadocidiidae BAT (con_50_majrule)" ) ) {
+ return false;
+ }
+ if ( !phylogenies[ 2 ].getName().equals( "Family Diadocidiidae BAT (con_50_majrule)" ) ) {
+ return false;
+ }
+ if ( !isEqual( 0.065284, phylogenies[ 7 ].getNode( "Bradysia_amoena" ).getDistanceToParent() ) ) {
+ return false;
+ }
+ if ( !isEqual( 0.065284, phylogenies[ 8 ].getNode( "Bradysia_amoena" ).getDistanceToParent() ) ) {
+ return false;
+ }
}
catch ( final Exception e ) {
e.printStackTrace( System.out );
if ( phy != null ) {
return false;
}
- //
p.reset();
if ( !p.hasNext() ) {
return false;
if ( phy != null ) {
return false;
}
- ////
p.setSource( Test.PATH_TO_TEST_DATA + "nexus_test_2.nex" );
if ( !p.hasNext() ) {
return false;
if ( phy != null ) {
return false;
}
- //
p.reset();
if ( !p.hasNext() ) {
return false;
if ( phy != null ) {
return false;
}
- ////
p.setSource( Test.PATH_TO_TEST_DATA + "nexus_test_3.nex" );
if ( !p.hasNext() ) {
return false;
if ( phy != null ) {
return false;
}
- ////
+ //
p.setSource( Test.PATH_TO_TEST_DATA + "nexus_test_4_1.nex" );
- // if ( phylogenies.length != 18 ) {
- // return false;
- // }
- //0
if ( !p.hasNext() ) {
return false;
}
+ //0
phy = p.next();
if ( phy == null ) {
return false;
return false;
}
if ( phy.getNumberOfExternalNodes() != 3 ) {
+ System.out.println( phy.toString() );
return false;
}
if ( !phy.getName().equals( "" ) ) {
if ( phy.isRooted() ) {
return false;
}
+ //
+ final NexusPhylogeniesParser p2 = new NexusPhylogeniesParser();
+ p2.setSource( Test.PATH_TO_TEST_DATA + "S15613.nex" );
+ // 0
+ if ( !p2.hasNext() ) {
+ return false;
+ }
+ phy = p2.next();
+ if ( !isEqual( 0.48039661496919533, phy.getNode( "Diadocidia_spinosula" ).getDistanceToParent() ) ) {
+ return false;
+ }
+ if ( !isEqual( 0.3959796191512233, phy.getNode( "Diadocidia_stanfordensis" ).getDistanceToParent() ) ) {
+ return false;
+ }
+ // 1
+ if ( !p2.hasNext() ) {
+ return false;
+ }
+ phy = p2.next();
+ // 2
+ if ( !p2.hasNext() ) {
+ return false;
+ }
+ phy = p2.next();
+ // 3
+ if ( !p2.hasNext() ) {
+ return false;
+ }
+ phy = p2.next();
+ // 4
+ if ( !p2.hasNext() ) {
+ return false;
+ }
+ phy = p2.next();
+ // 5
+ if ( !p2.hasNext() ) {
+ return false;
+ }
+ phy = p2.next();
+ // 6
+ if ( !p2.hasNext() ) {
+ return false;
+ }
+ phy = p2.next();
+ // 7
+ if ( !p2.hasNext() ) {
+ return false;
+ }
+ phy = p2.next();
+ // 8
+ if ( !p2.hasNext() ) {
+ return false;
+ }
+ phy = p2.next();
+ if ( !isEqual( 0.065284, phy.getNode( "Bradysia_amoena" ).getDistanceToParent() ) ) {
+ return false;
+ }
+ if ( p2.hasNext() ) {
+ return false;
+ }
+ phy = p2.next();
+ if ( phy != null ) {
+ return false;
+ }
+ // 0
+ p2.reset();
+ if ( !p2.hasNext() ) {
+ return false;
+ }
+ phy = p2.next();
+ if ( !isEqual( 0.48039661496919533, phy.getNode( "Diadocidia_spinosula" ).getDistanceToParent() ) ) {
+ return false;
+ }
+ if ( !isEqual( 0.3959796191512233, phy.getNode( "Diadocidia_stanfordensis" ).getDistanceToParent() ) ) {
+ return false;
+ }
}
catch ( final Exception e ) {
e.printStackTrace( System.out );
.equals( "Aranaeus" ) ) {
return false;
}
+ phylogenies = factory.create( Test.PATH_TO_TEST_DATA + "S14117.nex", parser );
+ if ( phylogenies.length != 3 ) {
+ return false;
+ }
+ if ( !isEqual( phylogenies[ 2 ].getNode( "Aloysia lycioides 251-76-02169" ).getDistanceToParent(),
+ 0.00100049 ) ) {
+ return false;
+ }
}
catch ( final Exception e ) {
e.printStackTrace( System.out );
nhxp.setTaxonomyExtraction( NHXParser.TAXONOMY_EXTRACTION.NO );
nhxp.setReplaceUnderscores( true );
final Phylogeny uc0 = factory.create( "(A__A_,_B_B)", nhxp )[ 0 ];
- if ( !uc0.getRoot().getChildNode( 0 ).getName().equals( "A A " ) ) {
+ if ( !uc0.getRoot().getChildNode( 0 ).getName().equals( "A A" ) ) {
return false;
}
- if ( !uc0.getRoot().getChildNode( 1 ).getName().equals( " B B" ) ) {
+ if ( !uc0.getRoot().getChildNode( 1 ).getName().equals( "B B" ) ) {
return false;
}
final Phylogeny p1b = factory
final Phylogeny[] p11 = factory.create( "(A,B11);(C,D11) (E,F11)\t(G,H11)", new NHXParser() );
final Phylogeny[] p12 = factory.create( "(A,B12) (C,D12) (E,F12) (G,H12)", new NHXParser() );
final Phylogeny[] p13 = factory.create( " ; (;A; , ; B ; 1 3 ; \n)\t ( \n ;"
- + " C ; ,; D;13;);;;;;;(;E;,;F;13 ;) ; "
- + "; ; ( \t\n\r\b; G ;, ;H ;1 3; ) ; ; ;",
- new NHXParser() );
+ + " C ; ,; D;13;);;;;;;(;E;,;F;13 ;) ; "
+ + "; ; ( \t\n\r\b; G ;, ;H ;1 3; ) ; ; ;",
+ new NHXParser() );
if ( !p13[ 0 ].toNewHampshireX().equals( "(';A;',';B;13;')" ) ) {
return false;
}
if ( p50.getNode( "A" ) == null ) {
return false;
}
- if ( !p50.toNewHampshire( false, NH_CONVERSION_SUPPORT_VALUE_STYLE.IN_SQUARE_BRACKETS )
- .equals( "((A,B)ab:2.0[88],C);" ) ) {
+ if ( !p50.toNewHampshire( NH_CONVERSION_SUPPORT_VALUE_STYLE.IN_SQUARE_BRACKETS )
+ .equals( "((A,B)ab:2.0[88],C);" ) ) {
+ return false;
+ }
+ if ( !p50.toNewHampshire( NH_CONVERSION_SUPPORT_VALUE_STYLE.NONE ).equals( "((A,B)ab:2.0,C);" ) ) {
+ return false;
+ }
+ if ( !p50.toNewHampshire( NH_CONVERSION_SUPPORT_VALUE_STYLE.AS_INTERNAL_NODE_NAMES )
+ .equals( "((A,B)88:2.0,C);" ) ) {
+ return false;
+ }
+ final Phylogeny p51 = factory.create( new StringBuffer( "((\"A(A\",B)ab:2[88],C)" ), new NHXParser() )[ 0 ];
+ if ( p51.getNode( "A(A" ) == null ) {
+ return false;
+ }
+ final Phylogeny p52 = factory.create( new StringBuffer( "(('A(A',B)ab:2[88],C)" ), new NHXParser() )[ 0 ];
+ if ( p52.getNode( "A(A" ) == null ) {
+ return false;
+ }
+ final Phylogeny p53 = factory
+ .create( new StringBuffer( "(('A(A',\"B (x (a' ,b) f(x);\"[com])[ment]ab:2[88],C)" ),
+ new NHXParser() )[ 0 ];
+ if ( p53.getNode( "B (x (a' ,b) f(x);" ) == null ) {
+ return false;
+ }
+ final Phylogeny p54 = factory.create( new StringBuffer( "((A,B):[88],C)" ), new NHXParser() )[ 0 ];
+ if ( p54.getNode( "A" ) == null ) {
+ return false;
+ }
+ if ( !p54.toNewHampshire( NH_CONVERSION_SUPPORT_VALUE_STYLE.IN_SQUARE_BRACKETS ).equals( "((A,B)[88],C);" ) ) {
return false;
}
- if ( !p50.toNewHampshire( false, NH_CONVERSION_SUPPORT_VALUE_STYLE.NONE ).equals( "((A,B)ab:2.0,C);" ) ) {
+ final Phylogeny p55 = factory
+ .create( new StringBuffer( "((\"lcl|HPV32_L1.:1 s\":0.195593,\"lcl|HPV30_L1.1|;a\":0.114237):0.0359322,\"lcl|HPV56_L1.1|,d\":0.0727412,\"lcl|HPV66_L1.1x\":0.0798012);" ),
+ new NHXParser() )[ 0 ];
+ if ( !p55
+ .toNewHampshire()
+ .equals( "(('lcl|HPV32_L1.:1 s':0.195593,'lcl|HPV30_L1.1|;a':0.114237):0.0359322,'lcl|HPV56_L1.1|,d':0.0727412,lcl|HPV66_L1.1x:0.0798012);" ) ) {
+ System.out.println( p55.toNewHampshire() );
return false;
}
- if ( !p50.toNewHampshire( false, NH_CONVERSION_SUPPORT_VALUE_STYLE.AS_INTERNAL_NODE_NAMES )
- .equals( "((A,B)88:2.0,C);" ) ) {
+ final Phylogeny p56 = factory
+ .create( new StringBuffer( "((\"lcl|HPV32_L1.:1 s\":0.195593,\"lcl|HPV30_L1.1|;a\":0.114\n237):0.0359322,\"lcl|HPV56_L1.1|,d\":0.0727412,\"lcl|HPV66_L1.1:x\":0.0798012);" ),
+ new NHXParser() )[ 0 ];
+ if ( !p56
+ .toNewHampshire()
+ .equals( "(('lcl|HPV32_L1.:1 s':0.195593,'lcl|HPV30_L1.1|;a':0.114237):0.0359322,'lcl|HPV56_L1.1|,d':0.0727412,'lcl|HPV66_L1.1:x':0.0798012);" ) ) {
+ System.out.println( p56.toNewHampshire() );
return false;
}
- final Phylogeny p51 = factory.create( new StringBuffer( "((\"A(A\",B)ab:2[88],C)" ), new NHXParser() )[ 0 ];
- if ( p51.getNode( "A(A" ) == null ) {
+ final Phylogeny p57 = factory
+ .create( new StringBuffer( "((\"lcl|HPV32_L1.:1 s\":0.195593,\"lcl|HPV30_L1.1|;a\":0.114\n237):0.0359322,\"lcl|HPV56_L1.1|,d\":0.0727412,\"lcl|HPV66_L1.1:x\":0.0798012);" ),
+ new NHXParser() )[ 0 ];
+ if ( !p57
+ .toNewHampshire()
+ .equals( "(('lcl|HPV32_L1.:1 s':0.195593,'lcl|HPV30_L1.1|;a':0.114237):0.0359322,'lcl|HPV56_L1.1|,d':0.0727412,'lcl|HPV66_L1.1:x':0.0798012);" ) ) {
+ System.out.println( p56.toNewHampshire() );
return false;
}
- final Phylogeny p52 = factory.create( new StringBuffer( "(('A(A',B)ab:2[88],C)" ), new NHXParser() )[ 0 ];
- if ( p52.getNode( "A(A" ) == null ) {
+ final String s58 = "('Homo \"man\" sapiens:1',\"Homo 'man' sapiens;\")';root \"1_ )';";
+ final Phylogeny p58 = factory.create( new StringBuffer( s58 ), new NHXParser() )[ 0 ];
+ if ( !p58.toNewHampshire().equals( s58 ) ) {
+ System.out.println( p58.toNewHampshire() );
return false;
}
- final Phylogeny p53 = factory
- .create( new StringBuffer( "(('A(A',\"B (x (a' ,b) f(x);\"[com])[ment]ab:2[88],C)" ),
- new NHXParser() )[ 0 ];
- if ( p53.getNode( "B (x (a' ,b) f(x);" ) == null ) {
+ final String s59 = "('Homo \"man sapiens:1',\"Homo 'man sapiens\")\"root; '1_ )\";";
+ final Phylogeny p59 = factory.create( new StringBuffer( s59 ), new NHXParser() )[ 0 ];
+ if ( !p59.toNewHampshire().equals( s59 ) ) {
+ System.out.println( p59.toNewHampshire() );
return false;
}
- //
- final Phylogeny p54 = factory.create( new StringBuffer( "((A,B):[88],C)" ), new NHXParser() )[ 0 ];
- if ( p54.getNode( "A" ) == null ) {
+ final String s60 = "('\" ;,:\":\"',\"'abc def' g's_\",'=:0.45+,.:%~`!@#$%^&*()_-+={} | ;,');";
+ final Phylogeny p60 = factory.create( new StringBuffer( s60 ), new NHXParser() )[ 0 ];
+ if ( !p60.toNewHampshire().equals( s60 ) ) {
+ System.out.println( p60.toNewHampshire() );
return false;
}
- if ( !p54.toNewHampshire( false, NH_CONVERSION_SUPPORT_VALUE_STYLE.IN_SQUARE_BRACKETS )
- .equals( "((A,B)[88],C);" ) ) {
+ final String s61 = "('H[omo] \"man\" sapiens:1',\"H[omo] 'man' sapiens;\",H[omo] sapiens)';root \"1_ )';";
+ final Phylogeny p61 = factory.create( new StringBuffer( s61 ), new NHXParser() )[ 0 ];
+ if ( !p61.toNewHampshire()
+ .equals( "('H{omo} \"man\" sapiens:1',\"H{omo} 'man' sapiens;\",Hsapiens)';root \"1_ )';" ) ) {
+ System.out.println( p61.toNewHampshire() );
return false;
}
}
if ( p.next() != null ) {
return false;
}
+ //
+ final String p30_str = "(A,B);(C,D)";
+ final NHXParser p30 = new NHXParser();
+ p30.setSource( p30_str );
+ if ( !p30.hasNext() ) {
+ return false;
+ }
+ Phylogeny phy30 = p30.next();
+ if ( !phy30.toNewHampshire().equals( "(A,B);" ) ) {
+ System.out.println( phy30.toNewHampshire() );
+ return false;
+ }
+ if ( !p30.hasNext() ) {
+ return false;
+ }
+ Phylogeny phy301 = p30.next();
+ if ( !phy301.toNewHampshire().equals( "(C,D);" ) ) {
+ System.out.println( phy301.toNewHampshire() );
+ return false;
+ }
+ if ( p30.hasNext() ) {
+ return false;
+ }
+ if ( p30.hasNext() ) {
+ return false;
+ }
+ if ( p30.next() != null ) {
+ return false;
+ }
+ if ( p30.next() != null ) {
+ return false;
+ }
+ p30.reset();
+ if ( !p30.hasNext() ) {
+ return false;
+ }
+ phy30 = p30.next();
+ if ( !phy30.toNewHampshire().equals( "(A,B);" ) ) {
+ System.out.println( phy30.toNewHampshire() );
+ return false;
+ }
+ if ( !p30.hasNext() ) {
+ return false;
+ }
+ phy301 = p30.next();
+ if ( !phy301.toNewHampshire().equals( "(C,D);" ) ) {
+ System.out.println( phy301.toNewHampshire() );
+ return false;
+ }
+ if ( p30.hasNext() ) {
+ return false;
+ }
+ if ( p30.hasNext() ) {
+ return false;
+ }
+ if ( p30.next() != null ) {
+ return false;
+ }
+ if ( p30.next() != null ) {
+ return false;
+ }
}
catch ( final Exception e ) {
e.printStackTrace( System.out );
System.out.println( n6.toNewHampshireX() );
return false;
}
+ final PhylogenyNode n7 = new PhylogenyNode();
+ n7.setName( " gks:dr-m4 \" ' `@:[]sadq04 " );
+ if ( !n7.toNewHampshire( true, PhylogenyNode.NH_CONVERSION_SUPPORT_VALUE_STYLE.IN_SQUARE_BRACKETS )
+ .equals( "'gks:dr-m4 \" ` `@:[]sadq04'" ) ) {
+ System.out.println( n7
+ .toNewHampshire( true, PhylogenyNode.NH_CONVERSION_SUPPORT_VALUE_STYLE.IN_SQUARE_BRACKETS ) );
+ return false;
+ }
}
catch ( final Exception e ) {
e.printStackTrace( System.out );
return false;
}
final PhylogenyNode n13 = PhylogenyNode
- .createInstanceFromNhxString( "blah_12345/1-2", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
- if ( !n13.getName().equals( "blah_12345/1-2" ) ) {
+ .createInstanceFromNhxString( "BLAH_12345/1-2", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
+ if ( !n13.getName().equals( "BLAH_12345/1-2" ) ) {
return false;
}
if ( PhylogenyMethods.getSpecies( n13 ).equals( "12345" ) ) {
return false;
}
final PhylogenyNode n19 = PhylogenyNode
- .createInstanceFromNhxString( "blah_1-roejojoej", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
+ .createInstanceFromNhxString( "BLAH_1-roejojoej", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
if ( !n19.getNodeData().getTaxonomy().getIdentifier().getValue().equals( "1" ) ) {
return false;
}
return false;
}
final PhylogenyNode n30 = PhylogenyNode
- .createInstanceFromNhxString( "blah_1234567-roejojoej",
+ .createInstanceFromNhxString( "BLAH_1234567-roejojoej",
NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
if ( !n30.getNodeData().getTaxonomy().getIdentifier().getValue().equals( "1234567" ) ) {
return false;
return false;
}
final PhylogenyNode n31 = PhylogenyNode
- .createInstanceFromNhxString( "blah_12345678-roejojoej",
+ .createInstanceFromNhxString( "BLAH_12345678-roejojoej",
NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
if ( n31.getNodeData().isHasTaxonomy() ) {
return false;
return false;
}
final PhylogenyNode n40 = PhylogenyNode
- .createInstanceFromNhxString( "bcl2_12345", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
+ .createInstanceFromNhxString( "BCL2_12345", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
if ( !n40.getNodeData().getTaxonomy().getIdentifier().getValue().equals( "12345" ) ) {
return false;
}
if ( !p10.toNewHampshireX().equals( "((A:0.2,B:0.3):0.5[&&NHX:B=91],C:0.1)root:0.1[&&NHX:B=100]" ) ) {
return false;
}
+ final Phylogeny p11 = factory
+ .create( " [79] ( ('A: \" ' [co mment] :0 .2[comment],B:0.3[com])[com ment]: 0. 5 \t[ 9 1 ][ comment],C: 0.1)[comment]root:0.1[100] [comment]",
+ new NHXParser() )[ 0 ];
+ if ( !p11.toNewHampshireX().equals( "(('A: \"':0.2,B:0.3):0.5[&&NHX:B=91],C:0.1)root:0.1[&&NHX:B=100]" ) ) {
+ return false;
+ }
+ final Phylogeny p12 = factory.create( "((A:0.2,B:0.3):0.5[&&NHX:B=91],C:0.1)root:0.1[&&NHX:B=100]",
+ new NHXParser() )[ 0 ];
+ if ( !p12.toNewHampshireX().equals( "((A:0.2,B:0.3):0.5[&&NHX:B=91],C:0.1)root:0.1[&&NHX:B=100]" ) ) {
+ return false;
+ }
}
catch ( final Exception e ) {
e.printStackTrace( System.out );
}
final Phylogeny p2 = factory
.create( "(1[something_else(?)s,prob=0.9500000000000000e+00{}(((,p)rob_stddev=0.110000000000e+00,"
- + "prob_range={1.000000000000000e+00,1.000000000000000e+00},prob(percent)=\"100\","
- + "prob+-sd=\"100+-0\"]:4.129000000000000e-02[&length_mean=4.153987461671767e-02,"
- + "length_median=4.129000000000000e-02,length_95%HPD={3.217800000000000e-02,"
- + "5.026800000000000e-02}],2[&prob=0.810000000000000e+00,prob_stddev=0.000000000000000e+00,"
- + "prob_range={1.000000000000000e+00,1.000000000000000e+00},prob(percent)=\"100\","
- + "prob+-sd=\"100+-0\"]:6.375699999999999e-02[&length_mean=6.395210411945065e-02,"
- + "length_median=6.375699999999999e-02,length_95%HPD={5.388600000000000e-02,"
- + "7.369400000000000e-02}])",
- new NHXParser() )[ 0 ];
+ + "prob_range={1.000000000000000e+00,1.000000000000000e+00},prob(percent)=\"100\","
+ + "prob+-sd=\"100+-0\"]:4.129000000000000e-02[&length_mean=4.153987461671767e-02,"
+ + "length_median=4.129000000000000e-02,length_95%HPD={3.217800000000000e-02,"
+ + "5.026800000000000e-02}],2[&prob=0.810000000000000e+00,prob_stddev=0.000000000000000e+00,"
+ + "prob_range={1.000000000000000e+00,1.000000000000000e+00},prob(percent)=\"100\","
+ + "prob+-sd=\"100+-0\"]:6.375699999999999e-02[&length_mean=6.395210411945065e-02,"
+ + "length_median=6.375699999999999e-02,length_95%HPD={5.388600000000000e-02,"
+ + "7.369400000000000e-02}])",
+ new NHXParser() )[ 0 ];
if ( p2.getNode( "1" ) == null ) {
return false;
}
if ( phy.getNodes( "'single quotes' inside double quotes" ).size() != 1 ) {
return false;
}
- if ( phy.getNodes( "double quotes inside single quotes" ).size() != 1 ) {
+ if ( phy.getNodes( "\"double quotes\" inside single quotes" ).size() != 1 ) {
return false;
}
if ( phy.getNodes( "noquotes" ).size() != 1 ) {
return false;
}
- if ( phy.getNodes( "A ( B C '" ).size() != 1 ) {
+ if ( phy.getNodes( "A ( B C '" ).size() != 1 ) {
return false;
}
final NHXParser p1p = new NHXParser();
final Phylogeny p10 = factory
.create( " [79] ( (\"A \n\tB \" [co mment] :0 .2[comment],'B':0.3[com])[com ment]: 0. 5 \t[ 9 1 ][ comment],'C (or D?\\//;,))': 0.1)[comment]'\nroot is here (cool, was! ) ':0.1[100] [comment]",
new NHXParser() )[ 0 ];
- final String p10_clean_str = "(('A B':0.2,B:0.3):0.5[&&NHX:B=91],'C (or D?\\//;,))':0.1)'root is here (cool, was! )':0.1[&&NHX:B=100]";
+ final String p10_clean_str = "(('A B':0.2,B:0.3):0.5[&&NHX:B=91],'C (or D?\\//;,))':0.1)'root is here (cool, was! )':0.1[&&NHX:B=100]";
if ( !p10.toNewHampshireX().equals( p10_clean_str ) ) {
return false;
}
if ( !p11.toNewHampshireX().equals( p10_clean_str ) ) {
return false;
}
- //
final Phylogeny p12 = factory
.create( " [79] ( (\"A \n\tB \" [[][] :0 .2[comment][\t&\t&\n N\tH\tX:S=mo\tnkey !],'\tB\t\b\t\n\f\rB B ':0.0\b3[])\t[com ment]: 0. 5 \t[ 9 1 ][ \ncomment],'C\t (or D?\\//;,))': 0.\b1)[comment]'\nroot \tis here (cool, \b\t\n\f\r was! ) ':0.1[100] [comment]",
new NHXParser() )[ 0 ];
- final String p12_clean_str = "(('A B':0.2[&&NHX:S=monkey!],'BB B':0.03):0.5[&&NHX:B=91],'C (or D?\\//;,))':0.1)'root is here (cool, was! )':0.1[&&NHX:B=100]";
+ final String p12_clean_str = "(('A B':0.2[&&NHX:S=monkey!],'BB B':0.03):0.5[&&NHX:B=91],'C (or D?\\//;,))':0.1)'root is here (cool, was! )':0.1[&&NHX:B=100]";
if ( !p12.toNewHampshireX().equals( p12_clean_str ) ) {
return false;
}
if ( !p13.toNewHampshireX().equals( p12_clean_str ) ) {
return false;
}
- final String p12_clean_str_nh = "(('A B':0.2,'BB B':0.03):0.5,'C (or D?\\//;,))':0.1)'root is here (cool, was! )':0.1;";
+ final String p12_clean_str_nh = "(('A B':0.2,'BB B':0.03):0.5,'C (or D?\\//;,))':0.1)'root is here (cool, was! )':0.1;";
if ( !p13.toNewHampshire().equals( p12_clean_str_nh ) ) {
return false;
}
// Do nothing -- means were not running from jar.
}
if ( xml_parser == null ) {
- xml_parser = new PhyloXmlParser();
+ xml_parser = PhyloXmlParser.createPhyloXmlParser();
if ( USE_LOCAL_PHYLOXML_SCHEMA ) {
xml_parser.setValidateAgainstSchema( PHYLOXML_LOCAL_XSD );
}
// J. of Comput Bio. Vol. 4, No 2, pp.177-187
final Phylogeny species6 = factory
.create( "(((1:[&&NHX:S=1],5:[&&NHX:S=5])1-5,((4:[&&NHX:S=4],6:[&&NHX:S=6])4-6,2:[&&NHX:S=2])4-6-2)1-5-4-6-2,"
- + "((9:[&&NHX:S=9],3:[&&NHX:S=3])9-3,(8:[&&NHX:S=8],7:[&&NHX:S=7])8-7)9-3-8-7)",
- new NHXParser() )[ 0 ];
+ + "((9:[&&NHX:S=9],3:[&&NHX:S=3])9-3,(8:[&&NHX:S=8],7:[&&NHX:S=7])8-7)9-3-8-7)",
+ new NHXParser() )[ 0 ];
final Phylogeny gene6 = factory
.create( "(((1:0.1[&&NHX:S=1],2:0.1[&&NHX:S=2])1-2:0.1,3:0.1[&&NHX:S=3])1-2-3:0.1,"
- + "((4:0.1[&&NHX:S=4],(5:0.1[&&NHX:S=5],6:0.1[&&NHX:S=6])5-6:0.1)4-5-6:0.1,"
- + "(7:0.1[&&NHX:S=7],(8:0.1[&&NHX:S=8],9:0.1[&&NHX:S=9])8-9:0.1)7-8-9:0.1)4-5-6-7-8-9:0.1)r;",
- new NHXParser() )[ 0 ];
+ + "((4:0.1[&&NHX:S=4],(5:0.1[&&NHX:S=5],6:0.1[&&NHX:S=6])5-6:0.1)4-5-6:0.1,"
+ + "(7:0.1[&&NHX:S=7],(8:0.1[&&NHX:S=8],9:0.1[&&NHX:S=9])8-9:0.1)7-8-9:0.1)4-5-6-7-8-9:0.1)r;",
+ new NHXParser() )[ 0 ];
species6.setRooted( true );
gene6.setRooted( true );
final SDI sdi6 = new SDI( gene6, species6 );
}
final Phylogeny species6 = factory
.create( "(((1:[&&NHX:S=1],5:[&&NHX:S=5])1-5,((4:[&&NHX:S=4],6:[&&NHX:S=6])4-6,2:[&&NHX:S=2])4-6-2)1-5-4-6-2,"
- + "((9:[&&NHX:S=9],3:[&&NHX:S=3])9-3,(8:[&&NHX:S=8],7:[&&NHX:S=7])8-7)9-3-8-7)",
- new NHXParser() )[ 0 ];
+ + "((9:[&&NHX:S=9],3:[&&NHX:S=3])9-3,(8:[&&NHX:S=8],7:[&&NHX:S=7])8-7)9-3-8-7)",
+ new NHXParser() )[ 0 ];
final Phylogeny gene6 = factory
.create( "((5:0.1[&&NHX:S=5],6:0.1[&&NHX:S=6])5-6:0.05[&&NHX:S=6],(4:0.1[&&NHX:S=4],"
- + "(((1:0.1[&&NHX:S=1],2:0.1[&&NHX:S=2])1-2:0.1[&&NHX:S=2],3:0.25[&&NHX:S=3])1-2-3:0.2[&&NHX:S=2],"
- + "(7:0.1[&&NHX:S=7],(8:0.1[&&NHX:S=8],"
- + "9:0.1[&&NHX:S=9])8-9:0.1[&&NHX:S=9])7-8-9:0.1[&&NHX:S=8])"
- + "4-5-6-7-8-9:0.1[&&NHX:S=5])4-5-6:0.05[&&NHX:S=5])",
- new NHXParser() )[ 0 ];
+ + "(((1:0.1[&&NHX:S=1],2:0.1[&&NHX:S=2])1-2:0.1[&&NHX:S=2],3:0.25[&&NHX:S=3])1-2-3:0.2[&&NHX:S=2],"
+ + "(7:0.1[&&NHX:S=7],(8:0.1[&&NHX:S=8],"
+ + "9:0.1[&&NHX:S=9])8-9:0.1[&&NHX:S=9])7-8-9:0.1[&&NHX:S=8])"
+ + "4-5-6-7-8-9:0.1[&&NHX:S=5])4-5-6:0.05[&&NHX:S=5])",
+ new NHXParser() )[ 0 ];
species6.setRooted( true );
gene6.setRooted( true );
Phylogeny[] p6 = sdi_unrooted.infer( gene6, species6, false, true, true, true, 10 );
p6 = null;
final Phylogeny species7 = factory
.create( "(((1:[&&NHX:S=1],5:[&&NHX:S=5])1-5,((4:[&&NHX:S=4],6:[&&NHX:S=6])4-6,2:[&&NHX:S=2])4-6-2)1-5-4-6-2,"
- + "((9:[&&NHX:S=9],3:[&&NHX:S=3])9-3,(8:[&&NHX:S=8],7:[&&NHX:S=7])8-7)9-3-8-7)",
- new NHXParser() )[ 0 ];
+ + "((9:[&&NHX:S=9],3:[&&NHX:S=3])9-3,(8:[&&NHX:S=8],7:[&&NHX:S=7])8-7)9-3-8-7)",
+ new NHXParser() )[ 0 ];
final Phylogeny gene7 = factory
.create( "((5:0.1[&&NHX:S=5],6:0.1[&&NHX:S=6])5-6:0.05[&&NHX:S=6],(4:0.1[&&NHX:S=4],"
- + "(((1:0.1[&&NHX:S=1],2:0.1[&&NHX:S=2])1-2:0.1[&&NHX:S=2],3:0.25[&&NHX:S=3])1-2-3:0.2[&&NHX:S=2],"
- + "(7:0.1[&&NHX:S=7],(8:0.1[&&NHX:S=8],"
- + "9:0.1[&&NHX:S=9])8-9:0.1[&&NHX:S=9])7-8-9:0.1[&&NHX:S=8])"
- + "4-5-6-7-8-9:0.1[&&NHX:S=5])4-5-6:0.05[&&NHX:S=5])",
- new NHXParser() )[ 0 ];
+ + "(((1:0.1[&&NHX:S=1],2:0.1[&&NHX:S=2])1-2:0.1[&&NHX:S=2],3:0.25[&&NHX:S=3])1-2-3:0.2[&&NHX:S=2],"
+ + "(7:0.1[&&NHX:S=7],(8:0.1[&&NHX:S=8],"
+ + "9:0.1[&&NHX:S=9])8-9:0.1[&&NHX:S=9])7-8-9:0.1[&&NHX:S=8])"
+ + "4-5-6-7-8-9:0.1[&&NHX:S=5])4-5-6:0.05[&&NHX:S=5])",
+ new NHXParser() )[ 0 ];
species7.setRooted( true );
gene7.setRooted( true );
Phylogeny[] p7 = sdi_unrooted.infer( gene7, species7, true, true, true, true, 10 );
p7 = null;
final Phylogeny species8 = factory
.create( "(((1:[&&NHX:S=1],5:[&&NHX:S=5])1-5,((4:[&&NHX:S=4],6:[&&NHX:S=6])4-6,2:[&&NHX:S=2])4-6-2)1-5-4-6-2,"
- + "((9:[&&NHX:S=9],3:[&&NHX:S=3])9-3,(8:[&&NHX:S=8],7:[&&NHX:S=7])8-7)9-3-8-7)",
- new NHXParser() )[ 0 ];
+ + "((9:[&&NHX:S=9],3:[&&NHX:S=3])9-3,(8:[&&NHX:S=8],7:[&&NHX:S=7])8-7)9-3-8-7)",
+ new NHXParser() )[ 0 ];
final Phylogeny gene8 = factory
.create( "((5:0.1[&&NHX:S=5],6:0.1[&&NHX:S=6])5-6:0.05[&&NHX:S=6],(4:0.1[&&NHX:S=4],"
- + "(((1:0.1[&&NHX:S=1],2:0.1[&&NHX:S=2])1-2:0.1[&&NHX:S=2],3:0.25[&&NHX:S=3])1-2-3:0.2[&&NHX:S=2],"
- + "(7:0.1[&&NHX:S=7],(8:0.1[&&NHX:S=8],"
- + "9:0.1[&&NHX:S=9])8-9:0.1[&&NHX:S=9])7-8-9:0.1[&&NHX:S=8])"
- + "4-5-6-7-8-9:0.1[&&NHX:S=5])4-5-6:0.05[&&NHX:S=5])",
- new NHXParser() )[ 0 ];
+ + "(((1:0.1[&&NHX:S=1],2:0.1[&&NHX:S=2])1-2:0.1[&&NHX:S=2],3:0.25[&&NHX:S=3])1-2-3:0.2[&&NHX:S=2],"
+ + "(7:0.1[&&NHX:S=7],(8:0.1[&&NHX:S=8],"
+ + "9:0.1[&&NHX:S=9])8-9:0.1[&&NHX:S=9])7-8-9:0.1[&&NHX:S=8])"
+ + "4-5-6-7-8-9:0.1[&&NHX:S=5])4-5-6:0.05[&&NHX:S=5])",
+ new NHXParser() )[ 0 ];
species8.setRooted( true );
gene8.setRooted( true );
Phylogeny[] p8 = sdi_unrooted.infer( gene8, species8, false, false, true, true, 10 );
return true;
}
+ private static boolean testSequenceDbWsTools1() {
+ try {
+ final PhylogenyNode n = new PhylogenyNode();
+ n.setName( "NP_001025424" );
+ Accession acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.REFSEQ.toString() )
+ || !acc.getValue().equals( "NP_001025424" ) ) {
+ return false;
+ }
+ n.setName( "340 0559 -- _NP_001025424_dsfdg15 05" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.REFSEQ.toString() )
+ || !acc.getValue().equals( "NP_001025424" ) ) {
+ return false;
+ }
+ n.setName( "NP_001025424.1" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.REFSEQ.toString() )
+ || !acc.getValue().equals( "NP_001025424" ) ) {
+ return false;
+ }
+ n.setName( "NM_001030253" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.REFSEQ.toString() )
+ || !acc.getValue().equals( "NM_001030253" ) ) {
+ return false;
+ }
+ n.setName( "BCL2_HUMAN" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.UNIPROT.toString() )
+ || !acc.getValue().equals( "BCL2_HUMAN" ) ) {
+ System.out.println( acc.toString() );
+ return false;
+ }
+ n.setName( "P10415" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.UNIPROT.toString() )
+ || !acc.getValue().equals( "P10415" ) ) {
+ System.out.println( acc.toString() );
+ return false;
+ }
+ n.setName( " P10415 " );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.UNIPROT.toString() )
+ || !acc.getValue().equals( "P10415" ) ) {
+ System.out.println( acc.toString() );
+ return false;
+ }
+ n.setName( "_P10415|" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.UNIPROT.toString() )
+ || !acc.getValue().equals( "P10415" ) ) {
+ System.out.println( acc.toString() );
+ return false;
+ }
+ n.setName( "AY695820" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.NCBI.toString() )
+ || !acc.getValue().equals( "AY695820" ) ) {
+ System.out.println( acc.toString() );
+ return false;
+ }
+ n.setName( "_AY695820_" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.NCBI.toString() )
+ || !acc.getValue().equals( "AY695820" ) ) {
+ System.out.println( acc.toString() );
+ return false;
+ }
+ n.setName( "AAA59452" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.NCBI.toString() )
+ || !acc.getValue().equals( "AAA59452" ) ) {
+ System.out.println( acc.toString() );
+ return false;
+ }
+ n.setName( "_AAA59452_" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.NCBI.toString() )
+ || !acc.getValue().equals( "AAA59452" ) ) {
+ System.out.println( acc.toString() );
+ return false;
+ }
+ n.setName( "AAA59452.1" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.NCBI.toString() )
+ || !acc.getValue().equals( "AAA59452.1" ) ) {
+ System.out.println( acc.toString() );
+ return false;
+ }
+ n.setName( "_AAA59452.1_" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.NCBI.toString() )
+ || !acc.getValue().equals( "AAA59452.1" ) ) {
+ System.out.println( acc.toString() );
+ return false;
+ }
+ n.setName( "GI:94894583" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.GI.toString() )
+ || !acc.getValue().equals( "94894583" ) ) {
+ System.out.println( acc.toString() );
+ return false;
+ }
+ n.setName( "gi|71845847|1,4-alpha-glucan branching enzyme [Dechloromonas aromatica RCB]" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.GI.toString() )
+ || !acc.getValue().equals( "71845847" ) ) {
+ System.out.println( acc.toString() );
+ return false;
+ }
+ n.setName( "gi|71845847|gb|AAZ45343.1| 1,4-alpha-glucan branching enzyme [Dechloromonas aromatica RCB]" );
+ acc = SequenceDbWsTools.obtainSeqAccession( n );
+ if ( ( acc == null ) || !acc.getSource().equals( Source.NCBI.toString() )
+ || !acc.getValue().equals( "AAZ45343.1" ) ) {
+ System.out.println( acc.toString() );
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ return false;
+ }
+ return true;
+ }
+
+ private static boolean testSequenceDbWsTools2() {
+ try {
+ final PhylogenyNode n1 = new PhylogenyNode( "NP_001025424" );
+ SequenceDbWsTools.obtainSeqInformation( n1 );
+ if ( !n1.getNodeData().getSequence().getName().equals( "Bcl2" ) ) {
+ return false;
+ }
+ if ( !n1.getNodeData().getTaxonomy().getScientificName().equals( "Danio rerio" ) ) {
+ return false;
+ }
+ if ( !n1.getNodeData().getSequence().getAccession().getSource().equals( Source.REFSEQ.toString() ) ) {
+ return false;
+ }
+ if ( !n1.getNodeData().getSequence().getAccession().getValue().equals( "NP_001025424" ) ) {
+ return false;
+ }
+ final PhylogenyNode n2 = new PhylogenyNode( "NM_001030253" );
+ SequenceDbWsTools.obtainSeqInformation( n2 );
+ if ( !n2.getNodeData().getSequence().getName().equals( "Danio rerio B-cell CLL/lymphoma 2a (bcl2a), mRNA" ) ) {
+ return false;
+ }
+ if ( !n2.getNodeData().getTaxonomy().getScientificName().equals( "Danio rerio" ) ) {
+ return false;
+ }
+ if ( !n2.getNodeData().getSequence().getAccession().getSource().equals( Source.REFSEQ.toString() ) ) {
+ return false;
+ }
+ if ( !n2.getNodeData().getSequence().getAccession().getValue().equals( "NM_001030253" ) ) {
+ return false;
+ }
+ final PhylogenyNode n3 = new PhylogenyNode( "NM_184234.2" );
+ SequenceDbWsTools.obtainSeqInformation( n3 );
+ if ( !n3.getNodeData().getSequence().getName()
+ .equals( "Homo sapiens RNA binding motif protein 39 (RBM39), transcript variant 1, mRNA" ) ) {
+ return false;
+ }
+ if ( !n3.getNodeData().getTaxonomy().getScientificName().equals( "Homo sapiens" ) ) {
+ return false;
+ }
+ if ( !n3.getNodeData().getSequence().getAccession().getSource().equals( Source.REFSEQ.toString() ) ) {
+ return false;
+ }
+ if ( !n3.getNodeData().getSequence().getAccession().getValue().equals( "NM_184234" ) ) {
+ return false;
+ }
+ }
+ catch ( final IOException e ) {
+ System.out.println();
+ System.out.println( "the following might be due to absence internet connection:" );
+ e.printStackTrace( System.out );
+ return true;
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace();
+ return false;
+ }
+ return true;
+ }
+
private static boolean testSequenceIdParsing() {
try {
- Identifier id = SequenceIdParser.parse( "gb_ADF31344_segmented_worms_" );
- if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getProvider() )
- || !id.getValue().equals( "ADF31344" ) || !id.getProvider().equals( "ncbi" ) ) {
+ Accession id = SequenceAccessionTools.parseAccessorFromString( "gb_ADF31344_segmented_worms_" );
+ if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() )
+ || !id.getValue().equals( "ADF31344" ) || !id.getSource().equals( "ncbi" ) ) {
if ( id != null ) {
System.out.println( "value =" + id.getValue() );
- System.out.println( "provider=" + id.getProvider() );
+ System.out.println( "provider=" + id.getSource() );
}
return false;
}
- //
- id = SequenceIdParser.parse( "segmented worms|gb_ADF31344" );
- if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getProvider() )
- || !id.getValue().equals( "ADF31344" ) || !id.getProvider().equals( "ncbi" ) ) {
+ id = SequenceAccessionTools.parseAccessorFromString( "segmented worms|gb_ADF31344" );
+ if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() )
+ || !id.getValue().equals( "ADF31344" ) || !id.getSource().equals( "ncbi" ) ) {
if ( id != null ) {
System.out.println( "value =" + id.getValue() );
- System.out.println( "provider=" + id.getProvider() );
+ System.out.println( "provider=" + id.getSource() );
}
return false;
}
- //
- id = SequenceIdParser.parse( "segmented worms gb_ADF31344 and more" );
- if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getProvider() )
- || !id.getValue().equals( "ADF31344" ) || !id.getProvider().equals( "ncbi" ) ) {
+ id = SequenceAccessionTools.parseAccessorFromString( "segmented worms gb_ADF31344 and more" );
+ if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() )
+ || !id.getValue().equals( "ADF31344" ) || !id.getSource().equals( "ncbi" ) ) {
+ if ( id != null ) {
+ System.out.println( "value =" + id.getValue() );
+ System.out.println( "provider=" + id.getSource() );
+ }
+ return false;
+ }
+ id = SequenceAccessionTools.parseAccessorFromString( "gb_AAA96518_1" );
+ if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() )
+ || !id.getValue().equals( "AAA96518" ) || !id.getSource().equals( "ncbi" ) ) {
+ if ( id != null ) {
+ System.out.println( "value =" + id.getValue() );
+ System.out.println( "provider=" + id.getSource() );
+ }
+ return false;
+ }
+ id = SequenceAccessionTools.parseAccessorFromString( "gb_EHB07727_1_rodents_" );
+ if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() )
+ || !id.getValue().equals( "EHB07727" ) || !id.getSource().equals( "ncbi" ) ) {
if ( id != null ) {
System.out.println( "value =" + id.getValue() );
- System.out.println( "provider=" + id.getProvider() );
+ System.out.println( "provider=" + id.getSource() );
}
return false;
}
- //
- id = SequenceIdParser.parse( "gb_AAA96518_1" );
- if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getProvider() )
- || !id.getValue().equals( "AAA96518" ) || !id.getProvider().equals( "ncbi" ) ) {
+ id = SequenceAccessionTools.parseAccessorFromString( "dbj_BAF37827_1_turtles_" );
+ if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() )
+ || !id.getValue().equals( "BAF37827" ) || !id.getSource().equals( "ncbi" ) ) {
if ( id != null ) {
System.out.println( "value =" + id.getValue() );
- System.out.println( "provider=" + id.getProvider() );
+ System.out.println( "provider=" + id.getSource() );
}
return false;
}
- //
- id = SequenceIdParser.parse( "gb_EHB07727_1_rodents_" );
- if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getProvider() )
- || !id.getValue().equals( "EHB07727" ) || !id.getProvider().equals( "ncbi" ) ) {
+ id = SequenceAccessionTools.parseAccessorFromString( "emb_CAA73223_1_primates_" );
+ if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() )
+ || !id.getValue().equals( "CAA73223" ) || !id.getSource().equals( "ncbi" ) ) {
if ( id != null ) {
System.out.println( "value =" + id.getValue() );
- System.out.println( "provider=" + id.getProvider() );
+ System.out.println( "provider=" + id.getSource() );
}
return false;
}
- //
- id = SequenceIdParser.parse( "dbj_BAF37827_1_turtles_" );
- if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getProvider() )
- || !id.getValue().equals( "BAF37827" ) || !id.getProvider().equals( "ncbi" ) ) {
+ id = SequenceAccessionTools.parseAccessorFromString( "mites|ref_XP_002434188_1" );
+ if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() )
+ || !id.getValue().equals( "XP_002434188" ) || !id.getSource().equals( "refseq" ) ) {
if ( id != null ) {
System.out.println( "value =" + id.getValue() );
- System.out.println( "provider=" + id.getProvider() );
+ System.out.println( "provider=" + id.getSource() );
}
return false;
}
- //
- id = SequenceIdParser.parse( "emb_CAA73223_1_primates_" );
- if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getProvider() )
- || !id.getValue().equals( "CAA73223" ) || !id.getProvider().equals( "ncbi" ) ) {
+ id = SequenceAccessionTools.parseAccessorFromString( "mites_ref_XP_002434188_1_bla_XP_12345" );
+ if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() )
+ || !id.getValue().equals( "XP_002434188" ) || !id.getSource().equals( "refseq" ) ) {
if ( id != null ) {
System.out.println( "value =" + id.getValue() );
- System.out.println( "provider=" + id.getProvider() );
+ System.out.println( "provider=" + id.getSource() );
}
return false;
}
- //
- id = SequenceIdParser.parse( "mites|ref_XP_002434188_1" );
- if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getProvider() )
- || !id.getValue().equals( "XP_002434188" ) || !id.getProvider().equals( "refseq" ) ) {
+ id = SequenceAccessionTools.parseAccessorFromString( "P4A123" );
+ if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() )
+ || !id.getValue().equals( "P4A123" ) || !id.getSource().equals( "uniprot" ) ) {
if ( id != null ) {
System.out.println( "value =" + id.getValue() );
- System.out.println( "provider=" + id.getProvider() );
+ System.out.println( "provider=" + id.getSource() );
}
return false;
}
- //
- id = SequenceIdParser.parse( "mites_ref_XP_002434188_1_bla_XP_12345" );
- if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getProvider() )
- || !id.getValue().equals( "XP_002434188" ) || !id.getProvider().equals( "refseq" ) ) {
+ id = SequenceAccessionTools.parseAccessorFromString( "XP_12345" );
+ if ( id != null ) {
+ System.out.println( "value =" + id.getValue() );
+ System.out.println( "provider=" + id.getSource() );
+ return false;
+ }
+ id = SequenceAccessionTools.parseAccessorFromString( "N3B004Z009" );
+ if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() )
+ || !id.getValue().equals( "N3B004Z009" ) || !id.getSource().equals( "uniprot" ) ) {
if ( id != null ) {
System.out.println( "value =" + id.getValue() );
- System.out.println( "provider=" + id.getProvider() );
+ System.out.println( "provider=" + id.getSource() );
}
return false;
}
- //
- id = SequenceIdParser.parse( "P4A123" );
- if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getProvider() )
- || !id.getValue().equals( "P4A123" ) || !id.getProvider().equals( "sp" ) ) {
+ id = SequenceAccessionTools.parseAccessorFromString( "A4CAA4ZBB9" );
+ if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() )
+ || !id.getValue().equals( "A4CAA4ZBB9" ) || !id.getSource().equals( "uniprot" ) ) {
if ( id != null ) {
System.out.println( "value =" + id.getValue() );
- System.out.println( "provider=" + id.getProvider() );
+ System.out.println( "provider=" + id.getSource() );
}
return false;
}
- //
- id = SequenceIdParser.parse( "pllf[pok P4A123_osdjfosnqo035-9233332904i000490 vf tmv x45" );
- if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getProvider() )
- || !id.getValue().equals( "P4A123" ) || !id.getProvider().equals( "sp" ) ) {
+ id = SequenceAccessionTools.parseAccessorFromString( "ecoli_A4CAA4ZBB9_rt" );
+ if ( ( id == null ) || ForesterUtil.isEmpty( id.getValue() ) || ForesterUtil.isEmpty( id.getSource() )
+ || !id.getValue().equals( "A4CAA4ZBB9" ) || !id.getSource().equals( "uniprot" ) ) {
if ( id != null ) {
System.out.println( "value =" + id.getValue() );
- System.out.println( "provider=" + id.getProvider() );
+ System.out.println( "provider=" + id.getSource() );
}
return false;
}
- //
- id = SequenceIdParser.parse( "XP_12345" );
+ id = SequenceAccessionTools.parseAccessorFromString( "Q4CAA4ZBB9" );
if ( id != null ) {
System.out.println( "value =" + id.getValue() );
- System.out.println( "provider=" + id.getProvider() );
+ System.out.println( "provider=" + id.getSource() );
return false;
}
- // lcl_91970_unknown_
}
catch ( final Exception e ) {
e.printStackTrace( System.out );
if ( !s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "F" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "G" ) );
if ( !s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "E" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "D" ) );
if ( !s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "F" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "G" ) );
if ( !s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "F" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "G" ) );
if ( !s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "F" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "A" ) );
if ( s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "A" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "E" ) );
if ( s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "F" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "G" ) );
if ( s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "A" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "B" ) );
if ( s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "A" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "D" ) );
if ( s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "A" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "B" ) );
if ( s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "A" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "C" ) );
if ( s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "A" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "E" ) );
if ( s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "A" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "F" ) );
if ( s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "A" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "G" ) );
if ( s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "A" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "F" ) );
if ( s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "A" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "B" ) );
if ( s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "E" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "D" ) );
if ( s0.match( query_nodes ) ) {
return false;
}
- //
query_nodes = new HashSet<PhylogenyNode>();
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "E" ) );
query_nodes.add( PhylogenyNode.createInstanceFromNhxString( "D" ) );
final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance();
final Phylogeny t0_1 = factory.create( "(((A,B),C),(D,E))", new NHXParser() )[ 0 ];
final Phylogeny[] phylogenies_1 = factory.create( "(((A,B),C),(D,E)) " + "(((C,B),A),(D,E))"
- + "(((A,B),C),(D,E)) " + "(((A,B),C),(D,E))"
- + "(((A,B),C),(D,E))" + "(((C,B),A),(D,E))"
- + "(((E,B),D),(C,A))" + "(((C,B),A),(D,E))"
- + "(((A,B),C),(D,E))" + "(((A,B),C),(D,E))",
- new NHXParser() );
+ + "(((A,B),C),(D,E)) " + "(((A,B),C),(D,E))"
+ + "(((A,B),C),(D,E))" + "(((C,B),A),(D,E))"
+ + "(((E,B),D),(C,A))" + "(((C,B),A),(D,E))"
+ + "(((A,B),C),(D,E))" + "(((A,B),C),(D,E))",
+ new NHXParser() );
SupportCount.count( t0_1, phylogenies_1, true, false );
final Phylogeny t0_2 = factory.create( "(((((A,B),C),D),E),(F,G))", new NHXParser() )[ 0 ];
final Phylogeny[] phylogenies_2 = factory.create( "(((((A,B),C),D),E),(F,G))"
- + "(((((A,B),C),D),E),((F,G),X))"
- + "(((((A,Y),B),C),D),((F,G),E))"
- + "(((((A,B),C),D),E),(F,G))"
- + "(((((A,B),C),D),E),(F,G))"
- + "(((((A,B),C),D),E),(F,G))"
- + "(((((A,B),C),D),E),(F,G),Z)"
- + "(((((A,B),C),D),E),(F,G))"
- + "((((((A,B),C),D),E),F),G)"
- + "(((((X,Y),F,G),E),((A,B),C)),D)",
- new NHXParser() );
+ + "(((((A,B),C),D),E),((F,G),X))"
+ + "(((((A,Y),B),C),D),((F,G),E))"
+ + "(((((A,B),C),D),E),(F,G))"
+ + "(((((A,B),C),D),E),(F,G))"
+ + "(((((A,B),C),D),E),(F,G))"
+ + "(((((A,B),C),D),E),(F,G),Z)"
+ + "(((((A,B),C),D),E),(F,G))"
+ + "((((((A,B),C),D),E),F),G)"
+ + "(((((X,Y),F,G),E),((A,B),C)),D)",
+ new NHXParser() );
SupportCount.count( t0_2, phylogenies_2, true, false );
final PhylogenyNodeIterator it = t0_2.iteratorPostorder();
while ( it.hasNext() ) {
return false;
}
final PhylogenyNode n3 = PhylogenyNode
- .createInstanceFromNhxString( "blag_12345", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
+ .createInstanceFromNhxString( "BLAG_12345", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
if ( !n3.getNodeData().getTaxonomy().getIdentifier().getValue().equals( "12345" ) ) {
System.out.println( n3.toString() );
return false;
return false;
}
final PhylogenyNode n6 = PhylogenyNode
- .createInstanceFromNhxString( "blag-12345-blag", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
+ .createInstanceFromNhxString( "BLAG-12345-blag", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
if ( n6.getNodeData().isHasTaxonomy() ) {
System.out.println( n6.toString() );
return false;
}
final PhylogenyNode n7 = PhylogenyNode
- .createInstanceFromNhxString( "blag-12345_blag", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
+ .createInstanceFromNhxString( "BLAG-12345_blag", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
if ( n7.getNodeData().isHasTaxonomy() ) {
System.out.println( n7.toString() );
return false;
}
final PhylogenyNode n8 = PhylogenyNode
- .createInstanceFromNhxString( "blag_12345-blag", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
+ .createInstanceFromNhxString( "BLAG_12345-blag", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
if ( !n8.getNodeData().getTaxonomy().getIdentifier().getValue().equals( "12345" ) ) {
System.out.println( n8.toString() );
return false;
}
final PhylogenyNode n9 = PhylogenyNode
- .createInstanceFromNhxString( "blag_12345/blag", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
+ .createInstanceFromNhxString( "BLAG_12345/blag", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
if ( !n9.getNodeData().getTaxonomy().getIdentifier().getValue().equals( "12345" ) ) {
System.out.println( n9.toString() );
return false;
}
final PhylogenyNode n10x = PhylogenyNode
- .createInstanceFromNhxString( "blag_12X45-blag", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
+ .createInstanceFromNhxString( "BLAG_12X45-blag", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
if ( n10x.getNodeData().isHasTaxonomy() ) {
System.out.println( n10x.toString() );
return false;
}
final PhylogenyNode n10xx = PhylogenyNode
- .createInstanceFromNhxString( "blag_1YX45-blag", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
+ .createInstanceFromNhxString( "BLAG_1YX45-blag", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
if ( n10xx.getNodeData().isHasTaxonomy() ) {
System.out.println( n10xx.toString() );
return false;
}
final PhylogenyNode n10 = PhylogenyNode
- .createInstanceFromNhxString( "blag_9YX45-blag", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
+ .createInstanceFromNhxString( "BLAG_9YX45-blag", NHXParser.TAXONOMY_EXTRACTION.PFAM_STYLE_RELAXED );
if ( !n10.getNodeData().getTaxonomy().getTaxonomyCode().equals( "9YX45" ) ) {
System.out.println( n10.toString() );
return false;
System.out.println( n13.toString() );
return false;
}
+ final PhylogenyNode n14 = PhylogenyNode
+ .createInstanceFromNhxString( "Mus_musculus_392", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE );
+ if ( !n14.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus" ) ) {
+ System.out.println( n14.toString() );
+ return false;
+ }
+ final PhylogenyNode n15 = PhylogenyNode
+ .createInstanceFromNhxString( "Mus_musculus_K392", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE );
+ if ( !n15.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus" ) ) {
+ System.out.println( n15.toString() );
+ return false;
+ }
+ final PhylogenyNode n16 = PhylogenyNode
+ .createInstanceFromNhxString( "Mus musculus 392", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE );
+ if ( !n16.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus" ) ) {
+ System.out.println( n16.toString() );
+ return false;
+ }
+ final PhylogenyNode n17 = PhylogenyNode
+ .createInstanceFromNhxString( "Mus musculus K392", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE );
+ if ( !n17.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus" ) ) {
+ System.out.println( n17.toString() );
+ return false;
+ }
+ final PhylogenyNode n18 = PhylogenyNode
+ .createInstanceFromNhxString( "Mus_musculus_musculus_392", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE );
+ if ( !n18.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus musculus" ) ) {
+ System.out.println( n18.toString() );
+ return false;
+ }
+ final PhylogenyNode n19 = PhylogenyNode
+ .createInstanceFromNhxString( "Mus_musculus_musculus_K392",
+ NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE );
+ if ( !n19.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus musculus" ) ) {
+ System.out.println( n19.toString() );
+ return false;
+ }
+ final PhylogenyNode n20 = PhylogenyNode
+ .createInstanceFromNhxString( "Mus musculus musculus 392", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE );
+ if ( !n20.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus musculus" ) ) {
+ System.out.println( n20.toString() );
+ return false;
+ }
+ final PhylogenyNode n21 = PhylogenyNode
+ .createInstanceFromNhxString( "Mus musculus musculus K392",
+ NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE );
+ if ( !n21.getNodeData().getTaxonomy().getScientificName().equals( "Mus musculus musculus" ) ) {
+ System.out.println( n21.toString() );
+ return false;
+ }
+ final PhylogenyNode n23 = PhylogenyNode
+ .createInstanceFromNhxString( "9EMVE_Nematostella_vectensis",
+ NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE );
+ if ( !n23.getNodeData().getTaxonomy().getScientificName().equals( "Nematostella vectensis" ) ) {
+ System.out.println( n23.toString() );
+ return false;
+ }
+ final PhylogenyNode n24 = PhylogenyNode
+ .createInstanceFromNhxString( "9EMVE_Nematostella", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE );
+ if ( !n24.getNodeData().getTaxonomy().getTaxonomyCode().equals( "9EMVE" ) ) {
+ System.out.println( n24.toString() );
+ return false;
+ }
+ //
+ final PhylogenyNode n25 = PhylogenyNode
+ .createInstanceFromNhxString( "Nematostella_vectensis_NEMVE",
+ NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE );
+ if ( !n25.getNodeData().getTaxonomy().getTaxonomyCode().equals( "NEMVE" ) ) {
+ System.out.println( n25.toString() );
+ return false;
+ }
+ final PhylogenyNode n26 = PhylogenyNode
+ .createInstanceFromNhxString( "Nematostella_vectensis_9EMVE",
+ NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE );
+ if ( !n26.getNodeData().getTaxonomy().getScientificName().equals( "Nematostella vectensis" ) ) {
+ System.out.println( n26.toString() );
+ return false;
+ }
+ final PhylogenyNode n27 = PhylogenyNode
+ .createInstanceFromNhxString( "Nematostella_9EMVE", NHXParser.TAXONOMY_EXTRACTION.AGGRESSIVE );
+ if ( !n27.getNodeData().getTaxonomy().getTaxonomyCode().equals( "9EMVE" ) ) {
+ System.out.println( n27.toString() );
+ return false;
+ }
}
catch ( final Exception e ) {
e.printStackTrace( System.out );
return true;
}
+ private static boolean testTreeCopy() {
+ try {
+ final String str_0 = "((((a,b),c),d)[&&NHX:S=lizards],e[&&NHX:S=reptiles])r[&&NHX:S=animals]";
+ final Phylogeny t0 = Phylogeny.createInstanceFromNhxString( str_0 );
+ final Phylogeny t1 = t0.copy();
+ if ( !t1.toNewHampshireX().equals( t0.toNewHampshireX() ) ) {
+ return false;
+ }
+ if ( !t1.toNewHampshireX().equals( str_0 ) ) {
+ return false;
+ }
+ t0.deleteSubtree( t0.getNode( "c" ), true );
+ t0.deleteSubtree( t0.getNode( "a" ), true );
+ t0.getRoot().getNodeData().getTaxonomy().setScientificName( "metazoa" );
+ t0.getNode( "b" ).setName( "Bee" );
+ if ( !t0.toNewHampshireX().equals( "((Bee,d)[&&NHX:S=lizards],e[&&NHX:S=reptiles])r[&&NHX:S=metazoa]" ) ) {
+ return false;
+ }
+ if ( !t1.toNewHampshireX().equals( str_0 ) ) {
+ return false;
+ }
+ t0.deleteSubtree( t0.getNode( "e" ), true );
+ t0.deleteSubtree( t0.getNode( "Bee" ), true );
+ t0.deleteSubtree( t0.getNode( "d" ), true );
+ if ( !t1.toNewHampshireX().equals( str_0 ) ) {
+ return false;
+ }
+ }
+ catch ( final Exception e ) {
+ e.printStackTrace();
+ return false;
+ }
+ return true;
+ }
+
private static boolean testTreeMethods() {
try {
final PhylogenyFactory factory = ParserBasedPhylogenyFactory.getInstance();
private static boolean testUniprotEntryRetrieval() {
try {
- final SequenceDatabaseEntry entry = SequenceDbWsTools.obtainUniProtEntry( "P12345", 200 );
+ final SequenceDatabaseEntry entry = SequenceDbWsTools.obtainUniProtEntry( "P12345", 5000 );
if ( !entry.getAccession().equals( "P12345" ) ) {
return false;
}
if ( !entry.getSequenceName().equals( "Aspartate aminotransferase, mitochondrial" ) ) {
return false;
}
+ if ( !entry.getSequenceSymbol().equals( "mAspAT" ) ) {
+ return false;
+ }
+ if ( !entry.getGeneName().equals( "GOT2" ) ) {
+ return false;
+ }
if ( !entry.getTaxonomyIdentifier().equals( "9986" ) ) {
return false;
}
+ if ( entry.getMolecularSequence() == null ) {
+ return false;
+ }
+ if ( !entry
+ .getMolecularSequence()
+ .getMolecularSequenceAsString()
+ .startsWith( "MALLHSARVLSGVASAFHPGLAAAASARASSWWAHVEMGPPDPILGVTEAYKRDTNSKKMNLGVGAYRDDNGKPYVLPSVRKAEAQIAAKGLDKEYLPIGGLAEFCRASAELALGENSEV" )
+ || !entry.getMolecularSequence().getMolecularSequenceAsString().endsWith( "LAHAIHQVTK" ) ) {
+ System.out.println( "got: " + entry.getMolecularSequence().getMolecularSequenceAsString() );
+ System.out.println( "expected something else." );
+ return false;
+ }
}
catch ( final IOException e ) {
System.out.println();
e.printStackTrace( System.out );
return true;
}
+ catch ( final NullPointerException f ) {
+ f.printStackTrace( System.out );
+ return false;
+ }
catch ( final Exception e ) {
return false;
}