import org.forester.io.parsers.phyloxml.PhyloXmlParser;
import org.forester.io.parsers.tol.TolParser;
import org.forester.io.writers.PhylogenyWriter;
+import org.forester.msa.BasicMsa;
import org.forester.msa.Mafft;
import org.forester.msa.Msa;
import org.forester.msa.MsaInferrer;
+import org.forester.msa.MsaMethods;
import org.forester.pccx.TestPccx;
import org.forester.phylogeny.Phylogeny;
import org.forester.phylogeny.PhylogenyBranch;
import org.forester.phylogeny.factories.ParserBasedPhylogenyFactory;
import org.forester.phylogeny.factories.PhylogenyFactory;
import org.forester.phylogeny.iterators.PhylogenyNodeIterator;
+import org.forester.protein.Protein;
import org.forester.sdi.SDI;
import org.forester.sdi.SDIR;
import org.forester.sdi.SDIse;
-import org.forester.sdi.TaxonomyAssigner;
import org.forester.sdi.TestGSDI;
import org.forester.sequence.BasicSequence;
import org.forester.sequence.Sequence;
-import org.forester.surfacing.Protein;
import org.forester.surfacing.TestSurfacing;
import org.forester.tools.ConfidenceAssessor;
import org.forester.tools.SupportCount;
import org.forester.util.ForesterConstants;
import org.forester.util.ForesterUtil;
import org.forester.util.GeneralTable;
-import org.forester.ws.uniprot.DatabaseTools;
-import org.forester.ws.uniprot.SequenceDatabaseEntry;
-import org.forester.ws.uniprot.UniProtTaxonomy;
-import org.forester.ws.uniprot.UniProtWsTools;
+import org.forester.util.SequenceIdParser;
+import org.forester.ws.seqdb.SequenceDatabaseEntry;
+import org.forester.ws.seqdb.SequenceDbWsTools;
+import org.forester.ws.seqdb.UniProtTaxonomy;
import org.forester.ws.wabi.TxSearch;
import org.forester.ws.wabi.TxSearch.RANKS;
import org.forester.ws.wabi.TxSearch.TAX_NAME_CLASS;
System.exit( -1 );
}
final long start_time = new Date().getTime();
+ // Run the sequence id parsing check and record the outcome in the
+ // succeeded/failed counters, like every other check in this runner.
+ System.out.print( "Sequence id parsing: " );
+ if ( testSequenceIdParsing() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ // Count the failure and continue: a temporary System.exit( -1 ) here
+ // aborted the whole run and left this counter update unreachable.
+ failed++;
+ }
System.out.print( "Hmmscan output parser: " );
if ( testHmmscanOutputParser() ) {
System.out.println( "OK." );
System.out.println( "failed." );
failed++;
}
- System.out.print( "Taxonomy assigner: " );
- if ( Test.testTaxonomyAssigner() ) {
- System.out.println( "OK." );
- succeeded++;
- }
- else {
- System.out.println( "failed." );
- failed++;
- }
System.out.print( "SDIunrooted: " );
if ( Test.testSDIunrooted() ) {
System.out.println( "OK." );
System.out.println( "failed." );
failed++;
}
+ System.out.print( "Simple MSA quality: " );
+ if ( Test.testMsaQualityMethod() ) {
+ System.out.println( "OK." );
+ succeeded++;
+ }
+ else {
+ System.out.println( "failed." );
+ failed++;
+ }
// System.out.print( "WABI TxSearch: " );
// if ( Test.testWabiTxSearch() ) {
// System.out.println( "OK." );
return false;
}
final PhylogenyNode n = t3.getNode( "ABC" );
- PhylogenyNodeIterator it;
- for( it = n.iterateChildNodesForward(); it.hasNext(); ) {
- it.next();
- }
- for( it.reset(); it.hasNext(); ) {
- it.next();
- }
- final PhylogenyNodeIterator it2 = n.iterateChildNodesForward();
- if ( !it2.next().getName().equals( "A" ) ) {
- return false;
- }
- if ( !it2.next().getName().equals( "B" ) ) {
- return false;
- }
- if ( !it2.next().getName().equals( "C" ) ) {
- return false;
- }
- if ( it2.hasNext() ) {
- return false;
- }
final Phylogeny t4 = factory.create( "((A:1,B:2,C:10)ABC:1,(D:3,E:5)DE:3,(F,G,H,I))", new NHXParser() )[ 0 ];
if ( t4.getNumberOfExternalNodes() != 9 ) {
return false;
return false;
}
t2.setIdentifier( new Identifier( "ecoli" ) );
- t2.setTaxonomyCode( "other" );
+ t2.setTaxonomyCode( "OTHER" );
t2.setScientificName( "what" );
t2.setCommonName( "something" );
if ( !t1.isEqual( t2 ) ) {
dss3.addValue( 10 );
final AsciiHistogram histo = new AsciiHistogram( dss3 );
histo.toStringBuffer( 10, '=', 40, 5 );
- histo.toStringBuffer( 3, 8, 10, '=', 40, 5 );
+ histo.toStringBuffer( 3, 8, 10, '=', 40, 5, null );
}
catch ( final Exception e ) {
e.printStackTrace( System.out );
if ( p1.getNumberOfProteinDomains() != 15 ) {
return false;
}
+ if ( p1.getLength() != 850 ) {
+ return false;
+ }
final Protein p2 = proteins.get( 1 );
if ( p2.getNumberOfProteinDomains() != 51 ) {
return false;
}
+ if ( p2.getLength() != 1291 ) {
+ return false;
+ }
final Protein p3 = proteins.get( 2 );
if ( p3.getNumberOfProteinDomains() != 2 ) {
return false;
if ( PhylogenyMethods.getSpecies( n23 ).length() > 0 ) {
return false;
}
- if ( NHXParser.LIMIT_SPECIES_NAMES_TO_FIVE_CHARS ) {
- final PhylogenyNode a = PhylogenyNode
- .createInstanceFromNhxString( "n10_ECOLI/1-2",
- PhylogenyMethods.TAXONOMY_EXTRACTION.PFAM_STYLE_ONLY );
- if ( !a.getName().equals( "n10_ECOLI/1-2" ) ) {
- return false;
- }
- if ( !PhylogenyMethods.getSpecies( a ).equals( "ECOLI" ) ) {
- return false;
- }
- final PhylogenyNode b = PhylogenyNode
- .createInstanceFromNhxString( "n10_ECOLI1/1-2",
- PhylogenyMethods.TAXONOMY_EXTRACTION.PFAM_STYLE_ONLY );
- if ( !b.getName().equals( "n10_ECOLI1/1-2" ) ) {
- return false;
- }
- if ( !PhylogenyMethods.getSpecies( b ).equals( "ECOLI" ) ) {
- return false;
- }
- final PhylogenyNode c = PhylogenyNode
- .createInstanceFromNhxString( "n10_RATAF12/1000-2000",
- PhylogenyMethods.TAXONOMY_EXTRACTION.PFAM_STYLE_ONLY );
- if ( !c.getName().equals( "n10_RATAF12/1000-2000" ) ) {
- return false;
- }
- if ( !PhylogenyMethods.getSpecies( c ).equals( "RATAF" ) ) {
- return false;
- }
- final PhylogenyNode d = PhylogenyNode
- .createInstanceFromNhxString( "n10_RAT1/1-2",
- PhylogenyMethods.TAXONOMY_EXTRACTION.PFAM_STYLE_ONLY );
- if ( !d.getName().equals( "n10_RAT1/1-2" ) ) {
- return false;
- }
- if ( !PhylogenyMethods.getSpecies( d ).equals( "RAT" ) ) {
- return false;
- }
- final PhylogenyNode e = PhylogenyNode
- .createInstanceFromNhxString( "n10_RAT1", PhylogenyMethods.TAXONOMY_EXTRACTION.PFAM_STYLE_ONLY );
- if ( !e.getName().equals( "n10_RAT1" ) ) {
- return false;
- }
- if ( !ForesterUtil.isEmpty( PhylogenyMethods.getSpecies( e ) ) ) {
- return false;
- }
+ final PhylogenyNode a = PhylogenyNode
+ .createInstanceFromNhxString( "n10_ECOLI/1-2", PhylogenyMethods.TAXONOMY_EXTRACTION.PFAM_STYLE_ONLY );
+ if ( !a.getName().equals( "n10_ECOLI/1-2" ) ) {
+ return false;
+ }
+ if ( !PhylogenyMethods.getSpecies( a ).equals( "ECOLI" ) ) {
+ return false;
+ }
+ final PhylogenyNode b = PhylogenyNode
+ .createInstanceFromNhxString( "n10_ECOLI1/1-2",
+ PhylogenyMethods.TAXONOMY_EXTRACTION.PFAM_STYLE_ONLY );
+ if ( !b.getName().equals( "n10_ECOLI1/1-2" ) ) {
+ return false;
+ }
+ if ( !PhylogenyMethods.getSpecies( b ).equals( "ECOLI" ) ) {
+ return false;
+ }
+ final PhylogenyNode c = PhylogenyNode
+ .createInstanceFromNhxString( "n10_RATAF12/1000-2000",
+ PhylogenyMethods.TAXONOMY_EXTRACTION.PFAM_STYLE_ONLY );
+ if ( !c.getName().equals( "n10_RATAF12/1000-2000" ) ) {
+ return false;
+ }
+ if ( !PhylogenyMethods.getSpecies( c ).equals( "RATAF" ) ) {
+ return false;
+ }
+ final PhylogenyNode c1 = PhylogenyNode
+ .createInstanceFromNhxString( "n10_BOVIN_1/1000-2000",
+ PhylogenyMethods.TAXONOMY_EXTRACTION.PFAM_STYLE_ONLY );
+ if ( !c1.getName().equals( "n10_BOVIN_1/1000-2000" ) ) {
+ return false;
+ }
+ if ( !PhylogenyMethods.getSpecies( c1 ).equals( "BOVIN" ) ) {
+ return false;
+ }
+ final PhylogenyNode c2 = PhylogenyNode
+ .createInstanceFromNhxString( "n10_Bovin_1/1000-2000",
+ PhylogenyMethods.TAXONOMY_EXTRACTION.PFAM_STYLE_ONLY );
+ if ( !c2.getName().equals( "n10_Bovin_1/1000-2000" ) ) {
+ return false;
+ }
+ if ( !PhylogenyMethods.getSpecies( c2 ).equals( "" ) ) {
+ return false;
+ }
+ final PhylogenyNode d = PhylogenyNode
+ .createInstanceFromNhxString( "n10_RAT1/1-2", PhylogenyMethods.TAXONOMY_EXTRACTION.PFAM_STYLE_ONLY );
+ if ( !d.getName().equals( "n10_RAT1/1-2" ) ) {
+ return false;
+ }
+ if ( !PhylogenyMethods.getSpecies( d ).equals( "RAT" ) ) {
+ return false;
+ }
+ final PhylogenyNode e = PhylogenyNode
+ .createInstanceFromNhxString( "n10_RAT1", PhylogenyMethods.TAXONOMY_EXTRACTION.PFAM_STYLE_ONLY );
+ if ( !e.getName().equals( "n10_RAT1" ) ) {
+ return false;
+ }
+ if ( !ForesterUtil.isEmpty( PhylogenyMethods.getSpecies( e ) ) ) {
+ return false;
+ }
+ final PhylogenyNode e2 = PhylogenyNode
+ .createInstanceFromNhxString( "n10_RAT1", PhylogenyMethods.TAXONOMY_EXTRACTION.YES );
+ if ( !e2.getName().equals( "n10_RAT1" ) ) {
+ return false;
+ }
+ if ( !PhylogenyMethods.getSpecies( e2 ).equals( "RAT" ) ) {
+ return false;
+ }
+ final PhylogenyNode e3 = PhylogenyNode
+ .createInstanceFromNhxString( "n10_RAT~", PhylogenyMethods.TAXONOMY_EXTRACTION.YES );
+ if ( !e3.getName().equals( "n10_RAT~" ) ) {
+ return false;
+ }
+ if ( !PhylogenyMethods.getSpecies( e3 ).equals( "RAT" ) ) {
+ return false;
}
final PhylogenyNode n11 = PhylogenyNode
.createInstanceFromNhxString( "n111111_ECOLI/jdj:0.4",
if ( PhylogenyMethods.getSpecies( n12 ).length() > 0 ) {
return false;
}
+ final PhylogenyNode m = PhylogenyNode
+ .createInstanceFromNhxString( "n10_MOUSEa", PhylogenyMethods.TAXONOMY_EXTRACTION.YES );
+ if ( !m.getName().equals( "n10_MOUSEa" ) ) {
+ return false;
+ }
+ if ( !PhylogenyMethods.getSpecies( m ).equals( "MOUSE" ) ) {
+ return false;
+ }
+ final PhylogenyNode o = PhylogenyNode
+ .createInstanceFromNhxString( "n10_MOUSE_", PhylogenyMethods.TAXONOMY_EXTRACTION.YES );
+ if ( !o.getName().equals( "n10_MOUSE_" ) ) {
+ return false;
+ }
+ if ( !PhylogenyMethods.getSpecies( o ).equals( "MOUSE" ) ) {
+ return false;
+ }
final Property tvu1 = n5.getNodeData().getProperties().getProperty( "tag1" );
final Property tvu3 = n5.getNodeData().getProperties().getProperty( "tag3" );
if ( !tvu1.getRef().equals( "tag1" ) ) {
if ( !n13.getName().equals( "blah_12345/1-2" ) ) {
return false;
}
- if ( !PhylogenyMethods.getSpecies( n13 ).equals( "" ) ) {
+ if ( !PhylogenyMethods.getSpecies( n13 ).equals( "12345" ) ) {
return false;
}
final PhylogenyNode n14 = PhylogenyNode
return true;
}
- private static boolean testTaxonomyAssigner() {
- try {
- String s0_str = "(((([&&NHX:S=A],[&&NHX:S=B])[&&NHX:S=AB],[&&NHX:S=C])[&&NHX:S=ABC],[&&NHX:S=D])[&&NHX:S=ABCD],[&&NHX:S=E])[&&NHX:S=ABCDE]";
- String g0_str = "((([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=A])a,[&&NHX:S=B])b,[&&NHX:S=C])c";
- Phylogeny s0 = ParserBasedPhylogenyFactory.getInstance().create( s0_str, new NHXParser() )[ 0 ];
- Phylogeny g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- s0.setRooted( true );
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "A" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "AB" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "ABC" ) ) {
- return false;
- }
- g0_str = "((([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=A])a,[&&NHX:S=A])b,[&&NHX:S=A])c";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "A" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "A" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "A" ) ) {
- return false;
- }
- g0_str = "((([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=B])a,[&&NHX:S=A])b,[&&NHX:S=A])c";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "AB" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "AB" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "AB" ) ) {
- return false;
- }
- g0_str = "((([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=B])a,[&&NHX:S=C])b,[&&NHX:S=A])c";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "AB" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "ABC" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "ABC" ) ) {
- return false;
- }
- g0_str = "((([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=B])a,[&&NHX:S=C])b,[&&NHX:S=D])c";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "AB" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "ABC" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- g0_str = "((([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=E])a,[&&NHX:S=C])b,[&&NHX:S=D])c";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCDE" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCDE" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCDE" ) ) {
- return false;
- }
- g0_str = "((([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=E])a,[&&NHX:S=A])b,[&&NHX:S=A])c";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCDE" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCDE" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCDE" ) ) {
- return false;
- }
- s0_str = "(([&&NHX:S=A],[&&NHX:S=B],[&&NHX:S=C],[&&NHX:S=D])[&&NHX:S=ABCD],"
- + "([&&NHX:S=E],[&&NHX:S=F],[&&NHX:S=G],[&&NHX:S=H])[&&NHX:S=EFGH],"
- + "([&&NHX:S=I],[&&NHX:S=J],[&&NHX:S=K],[&&NHX:S=L])[&&NHX:S=IJKL], "
- + "([&&NHX:S=M],[&&NHX:S=N],[&&NHX:S=O],[&&NHX:S=P])[&&NHX:S=MNOP])[&&NHX:S=ROOT]";
- s0 = ParserBasedPhylogenyFactory.getInstance().create( s0_str, new NHXParser() )[ 0 ];
- s0.setRooted( true );
- g0_str = "(([&&NHX:S=A],[&&NHX:S=B],[&&NHX:S=C],[&&NHX:S=D])a,"
- + "([&&NHX:S=E],[&&NHX:S=F],[&&NHX:S=G],[&&NHX:S=H])b,"
- + "([&&NHX:S=I],[&&NHX:S=J],[&&NHX:S=K],[&&NHX:S=L])c, "
- + "([&&NHX:S=M],[&&NHX:S=N],[&&NHX:S=O],[&&NHX:S=P])d)r";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "EFGH" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "IJKL" ) ) {
- return false;
- }
- if ( !g0.getNode( "d" ).getNodeData().getTaxonomy().getScientificName().equals( "MNOP" ) ) {
- return false;
- }
- if ( !g0.getNode( "r" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- g0_str = "(([&&NHX:S=A],[&&NHX:S=B],[&&NHX:S=A],[&&NHX:S=B])a,"
- + "([&&NHX:S=E],[&&NHX:S=F],[&&NHX:S=F],[&&NHX:S=F])b,"
- + "([&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=I])c, "
- + "([&&NHX:S=M],[&&NHX:S=N],[&&NHX:S=O],[&&NHX:S=O])d)r";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "EFGH" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "IJKL" ) ) {
- return false;
- }
- if ( !g0.getNode( "d" ).getNodeData().getTaxonomy().getScientificName().equals( "MNOP" ) ) {
- return false;
- }
- if ( !g0.getNode( "r" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- g0_str = "(([&&NHX:S=A],[&&NHX:S=B],[&&NHX:S=A],[&&NHX:S=B])a,"
- + "([&&NHX:S=E],[&&NHX:S=F],[&&NHX:S=F],[&&NHX:S=F])b,"
- + "([&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L])c, "
- + "([&&NHX:S=M],[&&NHX:S=N],[&&NHX:S=A],[&&NHX:S=O])d)r";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "EFGH" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "L" ) ) {
- return false;
- }
- if ( !g0.getNode( "d" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- if ( !g0.getNode( "r" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- g0_str = "(([&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L])a,"
- + "([&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L])b,"
- + "([&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L])c, "
- + "([&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L])d)r";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "L" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "L" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "L" ) ) {
- return false;
- }
- if ( !g0.getNode( "d" ).getNodeData().getTaxonomy().getScientificName().equals( "L" ) ) {
- return false;
- }
- if ( !g0.getNode( "r" ).getNodeData().getTaxonomy().getScientificName().equals( "L" ) ) {
- return false;
- }
- g0_str = "((([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=A])a,[&&NHX:S=A])b,[&&NHX:S=A])c";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "A" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "A" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "A" ) ) {
- return false;
- }
- g0_str = "((([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=B])a,[&&NHX:S=I])b,[&&NHX:S=J])c";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- g0_str = "(((([&&NHX:S=A],[&&NHX:S=B],[&&NHX:S=C],[&&NHX:S=D])a,"
- + "([&&NHX:S=D],[&&NHX:S=C],[&&NHX:S=B],[&&NHX:S=A])b)ab,"
- + "([&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L])c)abc, "
- + "([&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L])d)r";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "ab" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "L" ) ) {
- return false;
- }
- if ( !g0.getNode( "abc" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- if ( !g0.getNode( "d" ).getNodeData().getTaxonomy().getScientificName().equals( "L" ) ) {
- return false;
- }
- if ( !g0.getNode( "r" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- g0_str = "(((([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=C],[&&NHX:S=D])a,"
- + "([&&NHX:S=D],[&&NHX:S=D],[&&NHX:S=B],[&&NHX:S=A])b)ab,"
- + "([&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L])c)abc, "
- + "([&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L])d)r";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "ab" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "L" ) ) {
- return false;
- }
- if ( !g0.getNode( "abc" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- if ( !g0.getNode( "d" ).getNodeData().getTaxonomy().getScientificName().equals( "L" ) ) {
- return false;
- }
- if ( !g0.getNode( "r" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- g0_str = "(((([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=C],[&&NHX:S=D])a,"
- + "([&&NHX:S=D],[&&NHX:S=D],[&&NHX:S=B],[&&NHX:S=A])b)ab,"
- + "([&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L])c)abc, "
- + "([&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=A])d)r";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "ab" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "L" ) ) {
- return false;
- }
- if ( !g0.getNode( "abc" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- if ( !g0.getNode( "d" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- if ( !g0.getNode( "r" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- g0_str = "(((([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=C],[&&NHX:S=D])a,"
- + "([&&NHX:S=D],[&&NHX:S=D],[&&NHX:S=B],[&&NHX:S=A])b)ab,"
- + "([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=A])c)abc, "
- + "([&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=A])d)r";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( !g0.getNode( "a" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "b" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "ab" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "A" ) ) {
- return false;
- }
- if ( !g0.getNode( "abc" ).getNodeData().getTaxonomy().getScientificName().equals( "ABCD" ) ) {
- return false;
- }
- if ( !g0.getNode( "d" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- if ( !g0.getNode( "r" ).getNodeData().getTaxonomy().getScientificName().equals( "ROOT" ) ) {
- return false;
- }
- s0_str = "(([&&NHX:S=A],[&&NHX:S=B],[&&NHX:S=C],[&&NHX:S=D]),"
- + "([&&NHX:S=E],[&&NHX:S=F],[&&NHX:S=G],[&&NHX:S=H]),"
- + "([&&NHX:S=I],[&&NHX:S=J],[&&NHX:S=K],[&&NHX:S=L]), "
- + "([&&NHX:S=M],[&&NHX:S=N],[&&NHX:S=O],[&&NHX:S=P]))";
- s0 = ParserBasedPhylogenyFactory.getInstance().create( s0_str, new NHXParser() )[ 0 ];
- s0.setRooted( true );
- g0_str = "(((([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=C],[&&NHX:S=D])a,"
- + "([&&NHX:S=D],[&&NHX:S=D],[&&NHX:S=B],[&&NHX:S=A])b)ab,"
- + "([&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=A],[&&NHX:S=A])c)abc, "
- + "([&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=L],[&&NHX:S=A])d)r";
- g0 = ParserBasedPhylogenyFactory.getInstance().create( g0_str, new NHXParser() )[ 0 ];
- g0.setRooted( true );
- TaxonomyAssigner.execute( g0, s0 );
- if ( g0.getNode( "a" ).getNodeData().isHasTaxonomy() ) {
- return false;
- }
- if ( !g0.getNode( "c" ).getNodeData().getTaxonomy().getScientificName().equals( "A" ) ) {
- return false;
- }
- }
- catch ( final Exception e ) {
- e.printStackTrace( System.out );
- return false;
- }
- return true;
- }
-
private static boolean testUniprotTaxonomySearch() {
try {
- List<UniProtTaxonomy> results = UniProtWsTools
- .getTaxonomiesFromCommonNameStrict( "starlet sea anemone", 10 );
+ List<UniProtTaxonomy> results = SequenceDbWsTools.getTaxonomiesFromCommonNameStrict( "starlet sea anemone",
+ 10 );
if ( results.size() != 1 ) {
return false;
}
return false;
}
results = null;
- results = UniProtWsTools.getTaxonomiesFromScientificNameStrict( "Nematostella vectensis", 10 );
+ results = SequenceDbWsTools.getTaxonomiesFromScientificNameStrict( "Nematostella vectensis", 10 );
if ( results.size() != 1 ) {
return false;
}
return false;
}
results = null;
- results = UniProtWsTools.getTaxonomiesFromId( "45351", 10 );
+ results = SequenceDbWsTools.getTaxonomiesFromId( "45351", 10 );
if ( results.size() != 1 ) {
return false;
}
return false;
}
results = null;
- results = UniProtWsTools.getTaxonomiesFromTaxonomyCode( "NEMVE", 10 );
+ results = SequenceDbWsTools.getTaxonomiesFromTaxonomyCode( "NEMVE", 10 );
if ( results.size() != 1 ) {
return false;
}
//Nucleotide: 1 letter + 5 numerals OR 2 letters + 6 numerals
//Protein: 3 letters + 5 numerals
//http://www.ncbi.nlm.nih.gov/Sequin/acc.html
- if ( !DatabaseTools.parseGenbankAccessor( "AY423861" ).equals( "AY423861" ) ) {
+ if ( !SequenceIdParser.parseGenbankAccessor( "AY423861" ).equals( "AY423861" ) ) {
return false;
}
- if ( !DatabaseTools.parseGenbankAccessor( ".AY423861." ).equals( "AY423861" ) ) {
+ if ( !SequenceIdParser.parseGenbankAccessor( ".AY423861." ).equals( "AY423861" ) ) {
return false;
}
- if ( DatabaseTools.parseGenbankAccessor( "AAY423861" ) != null ) {
+ if ( SequenceIdParser.parseGenbankAccessor( "AAY423861" ) != null ) {
return false;
}
- if ( DatabaseTools.parseGenbankAccessor( "AY4238612" ) != null ) {
+ if ( SequenceIdParser.parseGenbankAccessor( "AY4238612" ) != null ) {
return false;
}
- if ( DatabaseTools.parseGenbankAccessor( "AAY4238612" ) != null ) {
+ if ( SequenceIdParser.parseGenbankAccessor( "AAY4238612" ) != null ) {
return false;
}
- if ( DatabaseTools.parseGenbankAccessor( "Y423861" ) != null ) {
+ if ( SequenceIdParser.parseGenbankAccessor( "Y423861" ) != null ) {
return false;
}
- if ( !DatabaseTools.parseGenbankAccessor( "S12345" ).equals( "S12345" ) ) {
+ if ( !SequenceIdParser.parseGenbankAccessor( "S12345" ).equals( "S12345" ) ) {
return false;
}
- if ( !DatabaseTools.parseGenbankAccessor( "|S12345|" ).equals( "S12345" ) ) {
+ if ( !SequenceIdParser.parseGenbankAccessor( "|S12345|" ).equals( "S12345" ) ) {
return false;
}
- if ( DatabaseTools.parseGenbankAccessor( "|S123456" ) != null ) {
+ if ( SequenceIdParser.parseGenbankAccessor( "|S123456" ) != null ) {
return false;
}
- if ( DatabaseTools.parseGenbankAccessor( "ABC123456" ) != null ) {
+ if ( SequenceIdParser.parseGenbankAccessor( "ABC123456" ) != null ) {
return false;
}
- if ( !DatabaseTools.parseGenbankAccessor( "ABC12345" ).equals( "ABC12345" ) ) {
+ if ( !SequenceIdParser.parseGenbankAccessor( "ABC12345" ).equals( "ABC12345" ) ) {
return false;
}
- if ( !DatabaseTools.parseGenbankAccessor( "&ABC12345&" ).equals( "ABC12345" ) ) {
+ if ( !SequenceIdParser.parseGenbankAccessor( "&ABC12345&" ).equals( "ABC12345" ) ) {
return false;
}
- if ( DatabaseTools.parseGenbankAccessor( "ABCD12345" ) != null ) {
+ if ( SequenceIdParser.parseGenbankAccessor( "ABCD12345" ) != null ) {
return false;
}
return true;
}
private static boolean testUniprotEntryRetrieval() {
- if ( !UniProtWsTools.parseUniProtAccessor( "P12345" ).equals( "P12345" ) ) {
+ if ( !SequenceDbWsTools.parseUniProtAccessor( "P12345" ).equals( "P12345" ) ) {
return false;
}
- if ( UniProtWsTools.parseUniProtAccessor( "EP12345" ) != null ) {
+ if ( SequenceDbWsTools.parseUniProtAccessor( "EP12345" ) != null ) {
return false;
}
- if ( UniProtWsTools.parseUniProtAccessor( "3 4P12345" ) != null ) {
+ if ( SequenceDbWsTools.parseUniProtAccessor( "3 4P12345" ) != null ) {
return false;
}
- if ( UniProtWsTools.parseUniProtAccessor( "P12345E" ) != null ) {
+ if ( SequenceDbWsTools.parseUniProtAccessor( "P12345E" ) != null ) {
return false;
}
- if ( UniProtWsTools.parseUniProtAccessor( "P123455" ) != null ) {
+ if ( SequenceDbWsTools.parseUniProtAccessor( "P123455" ) != null ) {
return false;
}
- if ( UniProtWsTools.parseUniProtAccessor( "EP12345E" ) != null ) {
+ if ( SequenceDbWsTools.parseUniProtAccessor( "EP12345E" ) != null ) {
return false;
}
- if ( UniProtWsTools.parseUniProtAccessor( "AY423861" ) != null ) {
+ if ( SequenceDbWsTools.parseUniProtAccessor( "AY423861" ) != null ) {
return false;
}
- if ( !UniProtWsTools.parseUniProtAccessor( "P1DDD5" ).equals( "P1DDD5" ) ) {
+ if ( !SequenceDbWsTools.parseUniProtAccessor( "P1DDD5" ).equals( "P1DDD5" ) ) {
return false;
}
- if ( UniProtWsTools.parseUniProtAccessor( "P1DDDD" ) != null ) {
+ if ( SequenceDbWsTools.parseUniProtAccessor( "P1DDDD" ) != null ) {
return false;
}
- if ( !UniProtWsTools.parseUniProtAccessor( "P1234X/P12345/12-42" ).equals( "P12345" ) ) {
+ if ( !SequenceDbWsTools.parseUniProtAccessor( "P1234X/P12345/12-42" ).equals( "P12345" ) ) {
return false;
}
- if ( !UniProtWsTools.parseUniProtAccessor( "P1234X P12345 12-42" ).equals( "P12345" ) ) {
+ if ( !SequenceDbWsTools.parseUniProtAccessor( "P1234X P12345 12-42" ).equals( "P12345" ) ) {
return false;
}
- if ( !UniProtWsTools.parseUniProtAccessor( "P12345/12-42" ).equals( "P12345" ) ) {
+ if ( !SequenceDbWsTools.parseUniProtAccessor( "P12345/12-42" ).equals( "P12345" ) ) {
return false;
}
- if ( !UniProtWsTools.parseUniProtAccessor( "P1234X/P12345" ).equals( "P12345" ) ) {
+ if ( !SequenceDbWsTools.parseUniProtAccessor( "P1234X/P12345" ).equals( "P12345" ) ) {
return false;
}
try {
- final SequenceDatabaseEntry entry = UniProtWsTools.obtainUniProtEntry( "P12345", 200 );
+ final SequenceDatabaseEntry entry = SequenceDbWsTools.obtainUniProtEntry( "P12345", 200 );
if ( !entry.getAccession().equals( "P12345" ) ) {
return false;
}
try {
final String msa_str_0 = "seq1 abcd\n\nseq2 efgh\n";
final Msa msa_0 = GeneralMsaParser.parse( new ByteArrayInputStream( msa_str_0.getBytes() ) );
- final String msa_str_1 = "seq_1 abc\nseq2 ghi\nseq_1 def\nseq2 jkm\n";
+ final String msa_str_1 = "seq1 abc\nseq2 ghi\nseq1 def\nseq2 jkm\n";
final Msa msa_1 = GeneralMsaParser.parse( new ByteArrayInputStream( msa_str_1.getBytes() ) );
final String msa_str_2 = "seq1 abc\nseq2 ghi\n\ndef\njkm\n";
final Msa msa_2 = GeneralMsaParser.parse( new ByteArrayInputStream( msa_str_2.getBytes() ) );
final String msa_str_3 = "seq1 abc\n def\nseq2 ghi\n jkm\n";
final Msa msa_3 = GeneralMsaParser.parse( new ByteArrayInputStream( msa_str_3.getBytes() ) );
+ if ( !msa_1.getSequenceAsString( 0 ).toString().equalsIgnoreCase( "abcdef" ) ) {
+ return false;
+ }
+ if ( !msa_1.getSequenceAsString( 1 ).toString().equalsIgnoreCase( "ghixkm" ) ) {
+ return false;
+ }
+ if ( !msa_1.getIdentifier( 0 ).toString().equals( "seq1" ) ) {
+ return false;
+ }
+ if ( !msa_1.getIdentifier( 1 ).toString().equals( "seq2" ) ) {
+ return false;
+ }
+ if ( !msa_2.getSequenceAsString( 0 ).toString().equalsIgnoreCase( "abcdef" ) ) {
+ return false;
+ }
+ if ( !msa_2.getSequenceAsString( 1 ).toString().equalsIgnoreCase( "ghixkm" ) ) {
+ return false;
+ }
+ if ( !msa_2.getIdentifier( 0 ).toString().equals( "seq1" ) ) {
+ return false;
+ }
+ if ( !msa_2.getIdentifier( 1 ).toString().equals( "seq2" ) ) {
+ return false;
+ }
+ if ( !msa_3.getSequenceAsString( 0 ).toString().equalsIgnoreCase( "abcdef" ) ) {
+ return false;
+ }
+ if ( !msa_3.getSequenceAsString( 1 ).toString().equalsIgnoreCase( "ghixkm" ) ) {
+ return false;
+ }
+ if ( !msa_3.getIdentifier( 0 ).toString().equals( "seq1" ) ) {
+ return false;
+ }
+ if ( !msa_3.getIdentifier( 1 ).toString().equals( "seq2" ) ) {
+ return false;
+ }
final Msa msa_4 = GeneralMsaParser.parse( new FileInputStream( PATH_TO_TEST_DATA + "msa_1.txt" ) );
if ( !msa_4.getSequenceAsString( 0 ).toString().equalsIgnoreCase( "abcdefeeeeeeeexx" ) ) {
return false;
Msa msa = null;
final MsaInferrer mafft = Mafft.createInstance();
msa = mafft.infer( new File( PATH_TO_TEST_DATA + "ncbi_sn.fasta" ), opts );
- if ( ( msa == null ) || ( msa.getLength() < 10 ) || ( msa.getNumberOfSequences() != 19 ) ) {
+ if ( ( msa == null ) || ( msa.getLength() < 20 ) || ( msa.getNumberOfSequences() != 19 ) ) {
+ return false;
+ }
+ if ( !msa.getIdentifier( 0 ).toString().equals( "a" ) ) {
return false;
}
}
}
return true;
}
+
+ /**
+  * Builds a four-sequence alignment with BasicMsa.createInstance and checks the
+  * values returned by MsaMethods.calculateIdentityRatio for columns 0 through 3
+  * against 1, 0.5, 0.25 and 0.75 respectively.
+  *
+  * @return true if all four ratios match; false on the first mismatch or if any
+  *         exception is thrown (its stack trace is printed to System.out)
+  */
+ private static boolean testMsaQualityMethod() {
+     // All four sequences deliberately share the identifier "a", as in the original test.
+     final String[] rows = { "ABAXEFGHIJ", "ABBXEFGHIJ", "AXCXEFGHIJ", "AXDDEFGHIJ" };
+     try {
+         final List<Sequence> seqs = new ArrayList<Sequence>();
+         for( final String row : rows ) {
+             seqs.add( BasicSequence.createAaSequence( "a", row ) );
+         }
+         final Msa alignment = BasicMsa.createInstance( seqs );
+         // Short-circuit evaluation keeps the column-by-column order and stops at the first mismatch.
+         return isEqual( 1, MsaMethods.calculateIdentityRatio( alignment, 0 ) )
+                 && isEqual( 0.5, MsaMethods.calculateIdentityRatio( alignment, 1 ) )
+                 && isEqual( 0.25, MsaMethods.calculateIdentityRatio( alignment, 2 ) )
+                 && isEqual( 0.75, MsaMethods.calculateIdentityRatio( alignment, 3 ) );
+     }
+     catch ( final Exception e ) {
+         e.printStackTrace( System.out );
+         return false;
+     }
+ }
+
+ /**
+  * Runs SequenceIdParser.parse over a fixed list of sequence names and checks the
+  * value and provider of each resulting Identifier; finally checks that parsing
+  * "XP_12345" yields null.
+  * <p>
+  * When a non-null identifier does not match the expectation, its value and
+  * provider are printed to System.out before the test fails.
+  *
+  * @return true if every expectation holds; false on the first mismatch or if any
+  *         exception is thrown (its stack trace is printed to System.out)
+  */
+ private static boolean testSequenceIdParsing() {
+     // Each row: { text to parse, expected identifier value, expected provider }.
+     final String[][] expectations = {
+             { "gb_ADF31344_segmented_worms_", "ADF31344", "ncbi" },
+             { "segmented worms|gb_ADF31344", "ADF31344", "ncbi" },
+             { "segmented worms gb_ADF31344 and more", "ADF31344", "ncbi" },
+             { "gb_AAA96518_1", "AAA96518", "ncbi" },
+             { "gb_EHB07727_1_rodents_", "EHB07727", "ncbi" },
+             { "dbj_BAF37827_1_turtles_", "BAF37827", "ncbi" },
+             { "emb_CAA73223_1_primates_", "CAA73223", "ncbi" },
+             { "mites|ref_XP_002434188_1", "XP_002434188", "refseq" },
+             { "mites_ref_XP_002434188_1_bla_XP_12345", "XP_002434188", "refseq" } };
+     try {
+         for( final String[] row : expectations ) {
+             final Identifier parsed = SequenceIdParser.parse( row[ 0 ] );
+             final boolean matches = ( parsed != null ) && !ForesterUtil.isEmpty( parsed.getValue() )
+                     && !ForesterUtil.isEmpty( parsed.getProvider() ) && parsed.getValue().equals( row[ 1 ] )
+                     && parsed.getProvider().equals( row[ 2 ] );
+             if ( matches ) {
+                 continue;
+             }
+             // Show what was actually parsed to make the failure diagnosable.
+             if ( parsed != null ) {
+                 System.out.println( "value =" + parsed.getValue() );
+                 System.out.println( "provider=" + parsed.getProvider() );
+             }
+             return false;
+         }
+         // The test expects no identifier to be recognized in this string.
+         // Not yet covered (noted in the original test): lcl_91970_unknown_
+         return SequenceIdParser.parse( "XP_12345" ) == null;
+     }
+     catch ( final Exception e ) {
+         e.printStackTrace( System.out );
+         return false;
+     }
+ }
}