/*
* Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
* Copyright (C) $$Year-Rel$$ The Jalview Authors
*
* This file is part of Jalview.
*
* Jalview is free software: you can redistribute it and/or
* modify it under the terms of the GNU General Public License
* as published by the Free Software Foundation, either version 3
* of the License, or (at your option) any later version.
*
* Jalview is distributed in the hope that it will be useful, but
* WITHOUT ANY WARRANTY; without even the implied warranty
* of MERCHANTABILITY or FITNESS FOR A PARTICULAR
* PURPOSE. See the GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Jalview. If not, see <http://www.gnu.org/licenses/>.
* The Jalview Authors are detailed in the 'AUTHORS' file.
*/
package jalview.analysis;
import static org.testng.AssertJUnit.assertEquals;
import jalview.analysis.AnnotationSorter.SequenceAnnotationOrder;
import jalview.datamodel.Alignment;
import jalview.datamodel.AlignmentAnnotation;
import jalview.datamodel.Sequence;
import jalview.datamodel.SequenceI;
import java.util.ArrayList;
import java.util.List;
import java.util.Random;
import org.testng.annotations.BeforeMethod;
import org.testng.annotations.Test;
/**
 * Tests for {@link AnnotationSorter}: ordering of annotations by sequence and
 * label, placement of autocalculated annotations, and some (assertion-free)
 * timing runs that print elapsed times to standard output.
 */
public class AnnotationSorterTest
{
  private static final int NUM_SEQS = 6;

  private static final int NUM_ANNS = 7;

  private static final String SS = "secondary structure";

  AlignmentAnnotation[] anns = new AlignmentAnnotation[0];

  Alignment al = null;

  /*
   * Set up 6 sequences and 7 annotations.
   */
  @BeforeMethod(alwaysRun = true)
  public void setUp()
  {
    al = buildAlignment(NUM_SEQS);
    anns = buildAnnotations(NUM_ANNS);
  }

  /**
   * Construct an array of numAnns annotations. Annotation i is created with
   * label "secondary structure" + i, an empty description and 0 as the third
   * constructor argument.
   * 
   * @param numAnns
   *          the number of annotations to create
   * 
   * @return a newly allocated array holding exactly numAnns annotations
   */
  protected AlignmentAnnotation[] buildAnnotations(int numAnns)
  {
    List<AlignmentAnnotation> annlist = new ArrayList<AlignmentAnnotation>();
    for (int i = 0; i < numAnns; i++)
    {
      AlignmentAnnotation ann = new AlignmentAnnotation(SS + i, "", 0);
      annlist.add(ann);
    }
    /*
     * Always copy into a fresh array: passing the 'anns' field here would
     * overwrite it in place (and return it, null-padded) whenever it is
     * already long enough to hold the list.
     */
    return annlist.toArray(new AlignmentAnnotation[annlist.size()]);
  }

  /**
   * Make an alignment with numSeqs sequences in it. Sequence i is named
   * "Sequence" + i and every sequence has the same residues.
   * 
   * @param numSeqs
   *          the number of sequences to create
   * 
   * @return the new alignment
   */
  private Alignment buildAlignment(int numSeqs)
  {
    SequenceI[] seqs = new Sequence[numSeqs];
    for (int i = 0; i < numSeqs; i++)
    {
      seqs[i] = new Sequence("Sequence" + i, "axrdkfp");
    }
    return new Alignment(seqs);
  }

  /**
   * Attach the annotation at annIndex to the alignment sequence at seqIndex
   * and give it the specified label.
   * 
   * @param annIndex
   *          index into the anns fixture array
   * @param seqIndex
   *          index of the sequence in the al fixture alignment
   * @param label
   *          the label to set on the annotation
   */
  private void linkToSequence(int annIndex, int seqIndex, String label)
  {
    anns[annIndex].sequenceRef = al.getSequenceAt(seqIndex);
    anns[annIndex].label = label;
  }

  /**
   * Flag the annotation at annIndex as autocalculated (leaving it without a
   * sequence reference) and give it the specified label.
   * 
   * @param annIndex
   *          index into the anns fixture array
   * @param label
   *          the label to set on the annotation
   */
  private void markAutoCalculated(int annIndex, String label)
  {
    anns[annIndex].autoCalculated = true;
    anns[annIndex].label = label;
  }

  /**
   * Configure annotations 0-4, which are set up identically in every sort
   * order test.
   */
  private void configureCommonAnnotations()
  {
    linkToSequence(0, 1, "label0");
    linkToSequence(1, 3, "structure");
    linkToSequence(2, 3, "iron");
    markAutoCalculated(3, "Quality");
    markAutoCalculated(4, "Consensus");
  }

  /**
   * Fixture for the 'sequence then label' tests: three annotations on
   * sequence 3 whose labels differ in case, plus one each on sequences 0 and
   * 1, and two autocalculated annotations.
   */
  private void configureSequenceOrderAnnotations()
  {
    configureCommonAnnotations();
    linkToSequence(5, 0, "label5");
    linkToSequence(6, 3, "IRP");
  }

  /**
   * Fixture for the 'label then sequence' and 'no sort' tests: labels that
   * match apart from case ("iron"/"IRON", "structure"/"Structure") on
   * different sequences, plus two autocalculated annotations.
   */
  private void configureLabelOrderAnnotations()
  {
    configureCommonAnnotations();
    linkToSequence(5, 0, "IRON");
    linkToSequence(6, 2, "Structure");
  }

  /**
   * Assert that the anns fixture array holds exactly the expected number of
   * annotations and that their labels, in array order, equal the expected
   * labels.
   * 
   * @param expectedLabels
   *          the labels expected at positions 0, 1, 2...
   */
  private void assertLabelOrder(String... expectedLabels)
  {
    assertEquals(expectedLabels.length, anns.length);
    for (int i = 0; i < expectedLabels.length; i++)
    {
      assertEquals("anns[" + i + "].label", expectedLabels[i],
              anns[i].label);
    }
  }

  /**
   * Test sorting by annotation type (label) within sequence order, with
   * autocalculated annotations placed last. Expected outcome:
   * 
   * - annotations with a sequence ref sort in alignment sequence order
   * - multiple annotations for the same sequence ref sort by label,
   * non-case-specific
   * - autocalculated annotations (which have no sequence ref here) sort to
   * the end, keeping their mutual ordering
   */
  @Test(groups = { "Functional" })
  public void testSortBySequenceAndType_autocalcLast()
  {
    configureSequenceOrderAnnotations();

    AnnotationSorter testee = new AnnotationSorter(al, false);
    testee.sort(anns, SequenceAnnotationOrder.SEQUENCE_AND_LABEL);

    // @formatter:off
    assertLabelOrder(
            "label5",     // for sequence 0
            "label0",     // for sequence 1
            "iron",       // sequence 3 /iron
            "IRP",        // sequence 3/IRP
            "structure",  // sequence 3/structure
            "Quality",    // autocalc annotations
            "Consensus"); // retain ordering
    // @formatter:on
  }

  /**
   * Variant with autocalculated annotations sorting to front
   */
  @Test(groups = { "Functional" })
  public void testSortBySequenceAndType_autocalcFirst()
  {
    configureSequenceOrderAnnotations();

    AnnotationSorter testee = new AnnotationSorter(al, true);
    testee.sort(anns, SequenceAnnotationOrder.SEQUENCE_AND_LABEL);

    // @formatter:off
    assertLabelOrder(
            "Quality",    // autocalc annotations
            "Consensus",  // retain ordering
            "label5",     // for sequence 0
            "label0",     // for sequence 1
            "iron",       // sequence 3 /iron
            "IRP",        // sequence 3/IRP
            "structure"); // sequence 3/structure
    // @formatter:on
  }

  /**
   * Test sorting by sequence order within annotation type (label), with
   * autocalculated annotations placed last. Expected outcome:
   * 
   * - annotations sort by label, non-case-specific
   * - annotations whose labels differ only in case sort in alignment sequence
   * order
   * - autocalculated annotations (which have no sequence ref here) sort to
   * the end, keeping their mutual ordering
   */
  @Test(groups = { "Functional" })
  public void testSortByTypeAndSequence_autocalcLast()
  {
    configureLabelOrderAnnotations();

    AnnotationSorter testee = new AnnotationSorter(al, false);
    testee.sort(anns, SequenceAnnotationOrder.LABEL_AND_SEQUENCE);

    // @formatter:off
    assertLabelOrder(
            "IRON",       // IRON / sequence 0
            "iron",       // iron / sequence 3
            "label0",     // label0 / sequence 1
            "Structure",  // Structure / sequence 2
            "structure",  // structure / sequence 3
            "Quality",    // autocalc annotations
            "Consensus"); // retain ordering
    // @formatter:on
  }

  /**
   * Variant of test with autocalculated annotations sorted to front
   */
  @Test(groups = { "Functional" })
  public void testSortByTypeAndSequence_autocalcFirst()
  {
    configureLabelOrderAnnotations();

    AnnotationSorter testee = new AnnotationSorter(al, true);
    testee.sort(anns, SequenceAnnotationOrder.LABEL_AND_SEQUENCE);

    // @formatter:off
    assertLabelOrder(
            "Quality",    // autocalc annotations
            "Consensus",  // retain ordering
            "IRON",       // IRON / sequence 0
            "iron",       // iron / sequence 3
            "label0",     // label0 / sequence 1
            "Structure",  // Structure / sequence 2
            "structure"); // structure / sequence 3
    // @formatter:on
  }

  /**
   * Variant of test with autocalculated annotations sorted to front but
   * otherwise no change.
   */
  @Test(groups = { "Functional" })
  public void testNoSort_autocalcFirst()
  {
    configureLabelOrderAnnotations();

    AnnotationSorter testee = new AnnotationSorter(al, true);
    testee.sort(anns, SequenceAnnotationOrder.NONE);

    // @formatter:off
    assertLabelOrder(
            "Quality",    // autocalc annotations
            "Consensus",  // retain ordering
            "label0",     // the rest keep their original relative order
            "structure",
            "iron",
            "IRON",
            "Structure");
    // @formatter:on
  }

  /**
   * Print the time elapsed since startNanos, in the format shared by all the
   * timing tests.
   * 
   * @param description
   *          leading text of the message, including its trailing space
   * @param numSeqs
   *          number of sequences in the timed run
   * @param numAnns
   *          number of annotations in the timed run
   * @param startNanos
   *          value of System.nanoTime() taken just before the timed work
   */
  private static void reportElapsed(String description, int numSeqs,
          int numAnns, long startNanos)
  {
    // nanoTime is unaffected by wall-clock adjustments, unlike
    // currentTimeMillis
    final long elapsed = (System.nanoTime() - startNanos) / 1000000L;
    System.out.println(description + numSeqs + " sequences and " + numAnns
            + " annotations took " + elapsed + "ms");
  }

  /**
   * Build the label "label" followed by index left-padded with zeros to the
   * given number of digits.
   * 
   * @param index
   *          the number to append
   * @param width
   *          the minimum number of digits
   * @return the padded label
   */
  private static String paddedLabel(int index, int width)
  {
    final String digits = String.valueOf(index);
    StringBuilder sb = new StringBuilder("label");
    for (int pad = digits.length(); pad < width; pad++)
    {
      sb.append('0');
    }
    return sb.append(digits).toString();
  }

  /**
   * Timing tests for sorting annotations already in label order, for various
   * sizes.
   */
  @Test(groups = { "Functional" })
  public void testSort_timingPresorted()
  {
    testTiming_presorted(50, 100);
    testTiming_presorted(500, 1000);
    testTiming_presorted(5000, 10000);
  }

  /**
   * Test timing to sort annotations already in the sort order.
   * 
   * @param numSeqs
   *          number of sequences in the alignment
   * @param numAnns
   *          number of annotations to sort
   */
  private void testTiming_presorted(final int numSeqs, final int numAnns)
  {
    Alignment alignment = buildAlignment(numSeqs);
    AlignmentAnnotation[] annotations = buildAnnotations(numAnns);

    /*
     * Set the annotations presorted by label. The index is zero-padded so
     * that string order of the labels matches array order (unpadded,
     * "label10" would precede "label2"); this assumes the sorter compares
     * labels as strings.
     */
    final int width = String.valueOf(numAnns).length();
    Random r = new Random();
    final SequenceI[] sequences = alignment.getSequencesArray();
    for (int i = 0; i < annotations.length; i++)
    {
      SequenceI randomSequenceRef = sequences[r.nextInt(sequences.length)];
      annotations[i].sequenceRef = randomSequenceRef;
      annotations[i].label = paddedLabel(i, width);
    }

    final long start = System.nanoTime();
    AnnotationSorter testee = new AnnotationSorter(alignment, false);
    testee.sort(annotations, SequenceAnnotationOrder.LABEL_AND_SEQUENCE);
    reportElapsed("Timing test for presorted ", numSeqs, numAnns, start);
  }

  /**
   * Timing tests for sorting randomly sorted annotations for various sizes.
   */
  @Test(groups = { "Functional" })
  public void testSort_timingUnsorted()
  {
    testTiming_unsorted(50, 100);
    testTiming_unsorted(500, 1000);
    testTiming_unsorted(5000, 10000);
  }

  /**
   * Generate annotations randomly sorted with respect to sequences, and time
   * sorting.
   * 
   * @param numSeqs
   *          number of sequences in the alignment
   * @param numAnns
   *          number of annotations to sort
   */
  private void testTiming_unsorted(final int numSeqs, final int numAnns)
  {
    Alignment alignment = buildAlignment(numSeqs);
    AlignmentAnnotation[] annotations = buildAnnotations(numAnns);

    /*
     * Set the annotations in random order with respect to the sequences
     */
    Random r = new Random();
    final SequenceI[] sequences = alignment.getSequencesArray();
    for (int i = 0; i < annotations.length; i++)
    {
      SequenceI randomSequenceRef = sequences[r.nextInt(sequences.length)];
      annotations[i].sequenceRef = randomSequenceRef;
      annotations[i].label = "label" + i;
    }

    final long start = System.nanoTime();
    AnnotationSorter testee = new AnnotationSorter(alignment, false);
    testee.sort(annotations, SequenceAnnotationOrder.SEQUENCE_AND_LABEL);
    reportElapsed("Timing test for unsorted ", numSeqs, numAnns, start);
  }

  /**
   * Timing test for sorting annotations with a limited range of types (labels).
   */
  @Test(groups = { "Functional" })
  public void testSort_timingSemisorted()
  {
    testTiming_semiSorted(50, 100);
    testTiming_semiSorted(500, 1000);
    testTiming_semiSorted(5000, 10000);
  }

  /**
   * Mimic 'semi-sorted' annotations:
   * 
   * - set up in sequence order, with randomly assigned labels from a limited
   * range
   * - sort by label and sequence order, report timing
   * - resort by sequence and label, report timing
   * - resort by label and sequence, report timing
   * 
   * @param numSeqs
   *          number of sequences in the alignment
   * @param numAnns
   *          number of annotations to sort
   */
  private void testTiming_semiSorted(final int numSeqs, final int numAnns)
  {
    Alignment alignment = buildAlignment(numSeqs);
    AlignmentAnnotation[] annotations = buildAnnotations(numAnns);

    String[] labels = new String[] { "label1", "label2", "label3",
        "label4", "label5", "label6" };

    /*
     * Set the annotations in sequence order with randomly assigned labels.
     */
    Random r = new Random();
    final SequenceI[] sequences = alignment.getSequencesArray();
    for (int i = 0; i < annotations.length; i++)
    {
      SequenceI sequenceRef = sequences[i % sequences.length];
      annotations[i].sequenceRef = sequenceRef;
      annotations[i].label = labels[r.nextInt(labels.length)];
    }

    long start = System.nanoTime();
    AnnotationSorter testee = new AnnotationSorter(alignment, false);
    testee.sort(annotations, SequenceAnnotationOrder.LABEL_AND_SEQUENCE);
    reportElapsed("Sort by label for semisorted ", numSeqs, numAnns, start);

    // now resort by sequence
    start = System.nanoTime();
    testee.sort(annotations, SequenceAnnotationOrder.SEQUENCE_AND_LABEL);
    reportElapsed("Resort by sequence for semisorted ", numSeqs, numAnns,
            start);

    // now resort by label
    start = System.nanoTime();
    testee.sort(annotations, SequenceAnnotationOrder.LABEL_AND_SEQUENCE);
    reportElapsed("Resort by label for semisorted ", numSeqs, numAnns,
            start);
  }
}