X-Git-Url: http://source.jalview.org/gitweb/?a=blobdiff_plain;f=forester%2Fjava%2Fsrc%2Forg%2Fforester%2Fapplication%2Fsurfacing.java;h=095f730e94934869b7af20c0a49c22e6775b2028;hb=299c529fea070487998aee60ed7810af57f3a071;hp=d83fdf74b8d907271a19618705c0687176bc5561;hpb=87d34f343d0262cd0c009c6f1da058a5a217bc64;p=jalview.git diff --git a/forester/java/src/org/forester/application/surfacing.java b/forester/java/src/org/forester/application/surfacing.java index d83fdf7..095f730 100644 --- a/forester/java/src/org/forester/application/surfacing.java +++ b/forester/java/src/org/forester/application/surfacing.java @@ -187,6 +187,9 @@ public class surfacing { final static private String MAX_ALLOWED_OVERLAP_OPTION = "mo"; final static private String NO_ENGULFING_OVERLAP_OPTION = "no_eo"; final static private String IGNORE_COMBINATION_WITH_SAME_OPTION = "ignore_self_comb"; + final static private String PERFORM_DC_REGAIN_PROTEINS_STATS_OPTION = "dc_regain_stats"; + final static private String DA_ANALYSIS_OPTION = "DA_analyis"; + final static private String USE_LAST_IN_FITCH_OPTION = "last"; final static private String PAIRWISE_DOMAIN_COMPARISONS_PREFIX = "pwc_"; final static private String PAIRWISE_DOMAIN_COMPARISONS_OPTION = "pwc"; final static private String OUTPUT_FILE_OPTION = "o"; @@ -216,22 +219,16 @@ public class surfacing { + ForesterConstants.PHYLO_XML_SUFFIX; final static private String NJ_TREE_SHARED_BIN_COMBINATIONS_BASED_GENOME_DISTANCE_SUFFIX = "_bin_combinations_NJ" + ForesterConstants.PHYLO_XML_SUFFIX; - final static private String JACKNIFE_OPTION = "jack"; - final static private String JACKNIFE_RANDOM_SEED_OPTION = "seed"; - final static private String JACKNIFE_RATIO_OPTION = "jack_ratio"; - private static final int JACKNIFE_NUMBER_OF_RESAMPLINGS_DEFAULT = 100; - final static private long JACKNIFE_RANDOM_SEED_DEFAULT = 19; - final static private double JACKNIFE_RATIO_DEFAULT = 0.5; final static private String FILTER_POSITIVE_OPTION = "pos_filter"; final static private String FILTER_NEGATIVE_OPTION = "neg_filter"; final static private String FILTER_NEGATIVE_DOMAINS_OPTION = "neg_dom_filter"; final static private String INPUT_GENOMES_FILE_OPTION = "genomes"; final static private String INPUT_SPECIES_TREE_OPTION = "species_tree"; final static private String SEQ_EXTRACT_OPTION = "prot_extract"; - final static private String PRG_VERSION = "2.280"; - final static private String PRG_DATE = "130701"; + final static private String PRG_VERSION = "2.302"; + final static private String PRG_DATE = "130715"; final static private String E_MAIL = "czmasek@burnham.org"; - final static private String WWW = "www.phylosoft.org/forester/applications/surfacing"; + final static private String WWW = "https://sites.google.com/site/cmzmasek/home/software/forester/surfacing"; final static private boolean IGNORE_DUFS_DEFAULT = true; final static private boolean IGNORE_COMBINATION_WITH_SAME_DEFAULLT = false; final static private double MAX_E_VALUE_DEFAULT = -1; @@ -281,8 +278,7 @@ public class surfacing { public static final String INDEPENDENT_DC_GAINS_FITCH_PARS_DC_MAPPED_OUTPUT_SUFFIX = "_indep_dc_gains_fitch_lists_MAPPED.txt"; public static final String INDEPENDENT_DC_GAINS_FITCH_PARS_DC_FOR_GO_MAPPING_MAPPED_OUTPUT_SUFFIX = "_indep_dc_gains_fitch_lists_for_go_mapping_MAPPED.txt"; public static final String INDEPENDENT_DC_GAINS_FITCH_PARS_DC_FOR_GO_MAPPING_MAPPED_OUTPUT_UNIQUE_SUFFIX = "_indep_dc_gains_fitch_lists_for_go_mapping_unique_MAPPED.txt"; - private static final boolean PERFORM_DC_REGAIN_PROTEINS_STATS = true; - private static final boolean DA_ANALYSIS = false; + private static final boolean CALC_SIMILARITY_SCORES = false; private static void checkWriteabilityForPairwiseComparisons( final PrintableDomainSimilarity.PRINT_OPTION domain_similarity_print_option, final String[][] input_file_properties, @@ -605,9 +601,6 @@ public class surfacing { allowed_options.add( surfacing.PAIRWISE_DOMAIN_COMPARISONS_OPTION ); allowed_options.add( surfacing.IGNORE_DOMAINS_WITHOUT_COMBINATIONS_IN_ALL_SPECIES_OPTION ); allowed_options.add( surfacing.CONSIDER_DOMAIN_COMBINATION_DIRECTEDNESS ); - allowed_options.add( JACKNIFE_OPTION ); - allowed_options.add( JACKNIFE_RANDOM_SEED_OPTION ); - allowed_options.add( JACKNIFE_RATIO_OPTION ); allowed_options.add( INPUT_SPECIES_TREE_OPTION ); allowed_options.add( FILTER_POSITIVE_OPTION ); allowed_options.add( FILTER_NEGATIVE_OPTION ); @@ -623,6 +616,9 @@ public class surfacing { allowed_options.add( OUTPUT_LIST_OF_ALL_PROTEINS_OPTIONS ); allowed_options.add( CONSIDER_DOMAIN_COMBINATION_DIRECTEDNESS_AND_ADJACENCY ); allowed_options.add( WRITE_TO_NEXUS_OPTION ); + allowed_options.add( PERFORM_DC_REGAIN_PROTEINS_STATS_OPTION ); + allowed_options.add( DA_ANALYSIS_OPTION ); + allowed_options.add( USE_LAST_IN_FITCH_OPTION ); boolean ignore_dufs = surfacing.IGNORE_DUFS_DEFAULT; boolean ignore_combination_with_same = surfacing.IGNORE_COMBINATION_WITH_SAME_DEFAULLT; double e_value_max = surfacing.MAX_E_VALUE_DEFAULT; @@ -631,10 +627,22 @@ public class surfacing { if ( dissallowed_options.length() > 0 ) { ForesterUtil.fatalError( surfacing.PRG_NAME, "unknown option(s): " + dissallowed_options ); } + boolean use_last_in_fitch_parsimony = false; + if ( cla.isOptionSet( USE_LAST_IN_FITCH_OPTION ) ) { + use_last_in_fitch_parsimony = true; + } boolean write_to_nexus = false; if ( cla.isOptionSet( WRITE_TO_NEXUS_OPTION ) ) { write_to_nexus = true; } + boolean perform_dc_regain_proteins_stats = false; + if ( cla.isOptionSet( PERFORM_DC_REGAIN_PROTEINS_STATS_OPTION ) ) { + perform_dc_regain_proteins_stats = true; + } + boolean da_analysis = false; + if ( cla.isOptionSet( DA_ANALYSIS_OPTION ) ) { + da_analysis = true; + } boolean output_binary_domain_combinationsfor_graph_analysis = false; if ( cla.isOptionSet( DOMAIN_COMBINITONS_OUTPUT_OPTION_FOR_GRAPH_ANALYSIS ) ) { output_binary_domain_combinationsfor_graph_analysis = true; @@ -1145,56 +1153,9 @@ public class surfacing { && ( number_of_genomes > 2 ) ) { domain_similarity_sort_field = DomainSimilarity.DomainSimilaritySortField.ABS_MAX_COUNTS_DIFFERENCE; } - boolean jacknifed_distances = false; - int jacknife_resamplings = JACKNIFE_NUMBER_OF_RESAMPLINGS_DEFAULT; - double jacknife_ratio = JACKNIFE_RATIO_DEFAULT; - long random_seed = JACKNIFE_RANDOM_SEED_DEFAULT; - if ( cla.isOptionSet( surfacing.JACKNIFE_OPTION ) ) { - if ( ( number_of_genomes < 3 ) || !perform_pwc ) { - ForesterUtil.fatalError( surfacing.PRG_NAME, "cannot use jacknife resampling analysis (-" - + surfacing.JACKNIFE_OPTION + "[=]) without pairwise analyses (" - + surfacing.PAIRWISE_DOMAIN_COMPARISONS_OPTION - + "=)" ); - } - jacknifed_distances = true; - if ( cla.isOptionHasAValue( surfacing.JACKNIFE_OPTION ) ) { - try { - jacknife_resamplings = cla.getOptionValueAsInt( surfacing.JACKNIFE_OPTION ); - } - catch ( final IOException e ) { - ForesterUtil.fatalError( surfacing.PRG_NAME, "illegal format for number of resamplings" ); - } - if ( jacknife_resamplings < 2 ) { - ForesterUtil.fatalError( surfacing.PRG_NAME, "attempt to use less than 2 resamplings" ); - } - } - if ( cla.isOptionSet( surfacing.JACKNIFE_RATIO_OPTION ) - && cla.isOptionHasAValue( surfacing.JACKNIFE_RATIO_OPTION ) ) { - try { - jacknife_ratio = cla.getOptionValueAsDouble( surfacing.JACKNIFE_RATIO_OPTION ); - } - catch ( final IOException e ) { - ForesterUtil.fatalError( surfacing.PRG_NAME, "illegal format for jacknife ratio" ); - } - if ( ( jacknife_ratio <= 0.0 ) || ( jacknife_ratio >= 1.0 ) ) { - ForesterUtil.fatalError( surfacing.PRG_NAME, "attempt to use illegal value for jacknife ratio: " - + jacknife_ratio ); - } - } - if ( cla.isOptionSet( surfacing.JACKNIFE_RANDOM_SEED_OPTION ) - && cla.isOptionHasAValue( surfacing.JACKNIFE_RANDOM_SEED_OPTION ) ) { - try { - random_seed = cla.getOptionValueAsLong( surfacing.JACKNIFE_RANDOM_SEED_OPTION ); - } - catch ( final IOException e ) { - ForesterUtil.fatalError( surfacing.PRG_NAME, "illegal format for random generator seed" ); - } - } - } File[] intree_files = null; Phylogeny[] intrees = null; if ( cla.isOptionSet( surfacing.INPUT_SPECIES_TREE_OPTION ) ) { - // TODO FIXME if jacknife.... maybe not if ( number_of_genomes < 3 ) { ForesterUtil.fatalError( surfacing.PRG_NAME, "cannot infer gains and losses on input species trees (-" + surfacing.INPUT_SPECIES_TREE_OPTION + " without pairwise analyses (" @@ -1398,20 +1359,34 @@ public class surfacing { + ( dc_type == BinaryDomainCombination.DomainCombinationType.DIRECTED_ADJACTANT ) + "" + nl ); } + System.out.println( "Use last in Fitch parimony : " + use_last_in_fitch_parsimony ); + html_desc.append( "Use last in Fitch parimon:" + use_last_in_fitch_parsimony + "" + + nl ); System.out.println( "Write to Nexus files : " + write_to_nexus ); + html_desc.append( "Write to Nexus files:" + write_to_nexus + "" + nl ); + System.out.println( "DC regain prot stats : " + perform_dc_regain_proteins_stats ); + html_desc.append( "DC regain prot stats:" + perform_dc_regain_proteins_stats + "" + + nl ); + System.out.println( "DA analysis : " + da_analysis ); + html_desc.append( "DA analysis :" + da_analysis + "" + nl ); System.out.print( "Domain counts sort order : " ); + html_desc.append( "Domain counts sort order:" ); switch ( dc_sort_order ) { case ALPHABETICAL_KEY_ID: System.out.println( "alphabetical" ); + html_desc.append( "alphabetical" + "" + nl ); break; case KEY_DOMAIN_COUNT: System.out.println( "domain count" ); + html_desc.append( "domain count" + "" + nl ); break; case KEY_DOMAIN_PROTEINS_COUNT: System.out.println( "domain proteins count" ); + html_desc.append( "domain proteins count" + "" + nl ); break; case COMBINATIONS_COUNT: System.out.println( "domain combinations count" ); + html_desc.append( "domain combinations count" + "" + nl ); break; default: ForesterUtil.unexpectedFatalError( surfacing.PRG_NAME, "unknown value for dc sort order" ); @@ -1575,15 +1550,6 @@ public class surfacing { } System.out.println(); html_desc.append( "" + nl ); - if ( jacknifed_distances ) { - html_desc.append( "Jacknife:" + jacknife_resamplings + " resamplings" + nl ); - html_desc.append( "Jacknife ratio:" + ForesterUtil.round( jacknife_ratio, 2 ) - + "" + nl ); - html_desc.append( "Jacknife random number seed:" + random_seed + "" + nl ); - System.out.println( " Jacknife : " + jacknife_resamplings + " resamplings" ); - System.out.println( " Ratio : " + ForesterUtil.round( jacknife_ratio, 2 ) ); - System.out.println( " Random number seed : " + random_seed ); - } if ( ( intrees != null ) && ( intrees.length > 0 ) ) { for( final File intree_file : intree_files ) { html_desc.append( "Intree for gain/loss parsimony analysis:" + intree_file @@ -1657,7 +1623,7 @@ public class surfacing { if ( need_protein_lists_per_species ) { protein_lists_per_species = new TreeMap>(); } - final List gwcd_list = new ArrayList( number_of_genomes ); + List gwcd_list = new ArrayList( number_of_genomes ); final SortedSet all_domains_encountered = new TreeSet(); final SortedSet all_bin_domain_combinations_encountered = new TreeSet(); List all_bin_domain_combinations_gained_fitch = null; @@ -1666,7 +1632,7 @@ public class surfacing { all_bin_domain_combinations_gained_fitch = new ArrayList(); all_bin_domain_combinations_lost_fitch = new ArrayList(); } - final DomainLengthsTable domain_lengths_table = new DomainLengthsTable(); + DomainLengthsTable domain_lengths_table = new DomainLengthsTable(); final File per_genome_domain_promiscuity_statistics_file = new File( out_dir + ForesterUtil.FILE_SEPARATOR + output_file + D_PROMISCUITY_FILE_SUFFIX ); BufferedWriter per_genome_domain_promiscuity_statistics_writer = null; @@ -1733,7 +1699,7 @@ public class surfacing { Map protein_length_stats_by_dc = null; Map domain_number_stats_by_dc = null; final Map domain_length_stats_by_domain = new HashMap(); - if ( PERFORM_DC_REGAIN_PROTEINS_STATS ) { + if ( perform_dc_regain_proteins_stats ) { protein_length_stats_by_dc = new HashMap(); domain_number_stats_by_dc = new HashMap(); } @@ -1810,7 +1776,7 @@ public class surfacing { final double coverage = ( double ) protein_list.size() / parser.getProteinsEncountered(); protein_coverage_stats.addValue( coverage ); int distinct_das = -1; - if ( DA_ANALYSIS ) { + if ( da_analysis ) { final String genome = input_file_properties[ i ][ 0 ]; distinct_das = SurfacingUtil.storeDomainArchitectures( genome, distinct_domain_architecutures_per_genome, @@ -1870,29 +1836,12 @@ public class surfacing { log( "Proteins ignored due to positive filter : " + parser.getProteinsIgnoredDueToFilter(), log_writer ); } - if ( DA_ANALYSIS ) { + if ( da_analysis ) { System.out.println( "Distinct domain architectures stored : " + distinct_das ); log( "Distinct domain architectures stored : " + distinct_das, log_writer ); } System.out.println( "Time for processing : " + parser.getTime() + "ms" ); log( "", log_writer ); - html_desc.append( "" + input_file_properties[ i ][ 0 ] + " [species: " - + input_file_properties[ i ][ 1 ] + "]" + ":domains analyzed: " - + parser.getDomainsStored() + "; domains ignored: [ind score cutoffs: " - + parser.getDomainsIgnoredDueToIndividualScoreCutoff() + "] [E-value cutoff: " - + parser.getDomainsIgnoredDueToEval() + "] [DUF: " + parser.getDomainsIgnoredDueToDuf() - + "] [virus like ids: " + parser.getDomainsIgnoredDueToVirusLikeIds() - + "] [negative domain filter: " + parser.getDomainsIgnoredDueToNegativeDomainFilter() - + "] [overlap: " + parser.getDomainsIgnoredDueToOverlap() + "]" ); - if ( negative_filter_file != null ) { - html_desc.append( "; proteins ignored due to negative filter: " - + parser.getProteinsIgnoredDueToFilter() ); - } - if ( positive_filter_file != null ) { - html_desc.append( "; proteins ignored due to positive filter: " - + parser.getProteinsIgnoredDueToFilter() ); - } - html_desc.append( "" + nl ); try { int count = 0; for( final Protein protein : protein_list ) { @@ -1920,7 +1869,7 @@ public class surfacing { domains_which_never_single, domains_per_potein_stats_writer ); domain_lengths_table.addLengths( protein_list ); - if ( !DA_ANALYSIS ) { + if ( !da_analysis ) { gwcd_list.add( BasicGenomeWideCombinableDomains .createInstance( protein_list, ignore_combination_with_same, @@ -1977,7 +1926,7 @@ public class surfacing { ForesterUtil.programMessage( PRG_NAME, "Wrote domain promiscuities to: " + per_genome_domain_promiscuity_statistics_file ); // - if ( DA_ANALYSIS ) { + if ( da_analysis ) { SurfacingUtil.performDomainArchitectureAnalysis( distinct_domain_architecutures_per_genome, distinct_domain_architecuture_counts, 10, @@ -2061,12 +2010,13 @@ public class surfacing { ForesterUtil.programMessage( PRG_NAME, "Wrote domain length data to: " + domain_lengths_analysis_outfile ); System.out.println(); } + domain_lengths_table = null; final long analysis_start_time = new Date().getTime(); PairwiseDomainSimilarityCalculator pw_calc = null; - // double[] values_for_all_scores_histogram = null; final DomainSimilarityCalculator calc = new BasicDomainSimilarityCalculator( domain_similarity_sort_field, sort_by_species_count_first, - number_of_genomes == 2 ); + number_of_genomes == 2, + CALC_SIMILARITY_SCORES ); switch ( scoring ) { case COMBINATIONS: pw_calc = new CombinationsBasedPairwiseDomainSimilarityCalculator(); @@ -2089,11 +2039,7 @@ public class surfacing { gwcd_list, ignore_domains_without_combs_in_all_spec, ignore_species_specific_domains ); - SurfacingUtil.decoratePrintableDomainSimilarities( similarities, - detailedness, - go_annotation_output, - go_id_to_term_map, - go_namespace_limit ); + SurfacingUtil.decoratePrintableDomainSimilarities( similarities, detailedness ); final Map tax_code_to_id_map = SurfacingUtil.createTaxCodeToIdMap( intrees[ 0 ] ); try { String my_outfile = output_file.toString(); @@ -2125,19 +2071,21 @@ public class surfacing { + new java.text.SimpleDateFormat( "yyyy.MM.dd HH:mm:ss" ).format( new java.util.Date() ) + "" + nl ); html_desc.append( "" + nl ); - final DescriptiveStatistics pw_stats = SurfacingUtil - .writeDomainSimilaritiesToFile( html_desc, - new StringBuilder( number_of_genomes + " genomes" ), - writer, - split_writers, - similarities, - number_of_genomes == 2, - species_order, - domain_similarity_print_option, - domain_similarity_sort_field, - scoring, - true, - tax_code_to_id_map ); + final Writer simple_tab_writer = new BufferedWriter( new FileWriter( out_dir + ForesterUtil.FILE_SEPARATOR + + my_outfile + ".tsv" ) ); + SurfacingUtil.writeDomainSimilaritiesToFile( html_desc, + new StringBuilder( number_of_genomes + " genomes" ), + simple_tab_writer, + writer, + split_writers, + similarities, + number_of_genomes == 2, + species_order, + domain_similarity_print_option, + scoring, + true, + tax_code_to_id_map ); + simple_tab_writer.close(); ForesterUtil.programMessage( surfacing.PRG_NAME, "Wrote main output (includes domain similarities) to: \"" + ( out_dir == null ? my_outfile : out_dir + ForesterUtil.FILE_SEPARATOR + my_outfile ) + "\"" ); } @@ -2174,7 +2122,8 @@ public class surfacing { surfacing.PRG_NAME, out_dir, write_pwc_files, - tax_code_to_id_map ); + tax_code_to_id_map, + CALC_SIMILARITY_SCORES ); String matrix_output_file = new String( output_file.toString() ); if ( matrix_output_file.indexOf( '.' ) > 1 ) { matrix_output_file = matrix_output_file.substring( 0, matrix_output_file.indexOf( '.' ) ); @@ -2205,35 +2154,6 @@ public class surfacing { inferred_trees.add( nj_gd ); inferred_trees.add( nj_bc ); inferred_trees.add( nj_d ); - if ( jacknifed_distances ) { - pwgc.performPairwiseComparisonsJacknifed( species, - number_of_genomes, - gwcd_list, - true, - jacknife_resamplings, - jacknife_ratio, - random_seed ); - SurfacingUtil - .writeMatrixToFile( new File( matrix_output_file - + "_" - + ForesterUtil.round( jacknife_ratio, 2 ) - + "_" - + jacknife_resamplings - + surfacing.MATRIX_SHARED_BIN_COMBINATIONS_BASED_GENOME_DISTANCE_SUFFIX ), - pwgc.getSharedBinaryCombinationsBasedDistances() ); - SurfacingUtil - .writeMatrixToFile( new File( matrix_output_file + "_" + ForesterUtil.round( jacknife_ratio, 2 ) - + "_" + jacknife_resamplings - + surfacing.MATRIX_SHARED_DOMAINS_BASED_GENOME_DISTANCE_SUFFIX ), - pwgc.getSharedDomainsBasedDistances() ); - // if ( infer_species_trees ) { - // inferSpeciesTrees( new File( output_file + "_" + jacknife_resamplings - // + INFERRED_SBC_BASED_NJ_SPECIES_TREE_SUFFIX ), pwgc - // .getSharedBinaryCombinationsBasedDistances() ); - // inferSpeciesTrees( new File( output_file + "_" + jacknife_resamplings - // + INFERRED_SD_BASED_NJ_SPECIES_TREE_SUFFIX ), pwgc.getSharedDomainsBasedDistances() ); - // } - } } // if ( ( output_file != null ) && ( number_of_genomes > 2 ) && !isEmpty( automated_pairwise_comparison_suffix ) ) if ( ( out_dir != null ) && ( !perform_pwc ) ) { output_file = new File( out_dir + ForesterUtil.FILE_SEPARATOR + output_file ); @@ -2277,7 +2197,8 @@ public class surfacing { domain_number_stats_by_dc, domain_length_stats_by_domain, tax_code_to_id_map, - write_to_nexus ); + write_to_nexus, + use_last_in_fitch_parsimony ); // Listing of all domain combinations gained is only done if only one input tree is used. if ( ( domain_id_to_secondary_features_maps != null ) && ( domain_id_to_secondary_features_maps.length > 0 ) ) { @@ -2293,7 +2214,8 @@ public class surfacing { secondary_features_parsimony, intree, parameters_sb.toString(), - mapping_results_map ); + mapping_results_map, + use_last_in_fitch_parsimony ); if ( i == 0 ) { System.out.println(); System.out.println( "Mapping to secondary features:" ); @@ -2335,6 +2257,7 @@ public class surfacing { gwcd_list, output_list_of_all_proteins_per_domain_e_value_max ); } + gwcd_list = null; if ( all_bin_domain_combinations_gained_fitch != null ) { try { executeFitchGainsAnalysis( new File( output_file @@ -2550,17 +2473,6 @@ public class surfacing { System.out.println( surfacing.INPUT_SPECIES_TREE_OPTION + ": species tree, to perform (Dollo, Fitch) parismony analyses" ); System.out - .println( JACKNIFE_OPTION - + ": perform jacknife resampling for domain and binary domain combination based distance matrices [default resamplings: " - + JACKNIFE_NUMBER_OF_RESAMPLINGS_DEFAULT + "]" ); - System.out.println( JACKNIFE_RATIO_OPTION + ": ratio for jacknife resampling [default: " - + JACKNIFE_RATIO_DEFAULT + "]" ); - System.out.println( JACKNIFE_RANDOM_SEED_OPTION - + ": seed for random number generator for jacknife resampling [default: " - + JACKNIFE_RANDOM_SEED_DEFAULT + "]" ); - // System.out.println( surfacing.INFER_SPECIES_TREES_OPTION - // + ": to infer NJ species trees based on shared domains/binary domain combinations" ); - System.out .println( surfacing.INPUT_SPECIES_TREE_OPTION + "=: to infer domain/binary domain combination gains/losses on given species trees" ); System.out.println( surfacing.FILTER_POSITIVE_OPTION @@ -2588,7 +2500,10 @@ public class surfacing { System.out.println( surfacing.OUTPUT_LIST_OF_ALL_PROTEINS_OPTIONS + ": to output all proteins per domain" ); System.out.println( surfacing.OUTPUT_LIST_OF_ALL_PROTEINS_PER_DOMAIN_E_VALUE_OPTION + ": e value max per domain for output of all proteins per domain" ); + System.out.println( surfacing.USE_LAST_IN_FITCH_OPTION + ": to use last in Fitch parsimony" ); System.out.println( surfacing.WRITE_TO_NEXUS_OPTION + ": to output in Nexus format" ); + System.out.println( PERFORM_DC_REGAIN_PROTEINS_STATS_OPTION + ": to perform DC regain protein statistics" ); + System.out.println( DA_ANALYSIS_OPTION + ": to do DA analysis" ); System.out.println(); System.out.println( "Example 1: java -Xms128m -Xmx512m -cp path/to/forester.jar" + " org.forester.application.surfacing p2g=pfam2go_2012_02_07.txt -dufs -cos=Pfam_260_NC1"