package jalview.ext.ensembl; import static org.testng.AssertJUnit.assertEquals; import static org.testng.AssertJUnit.assertNull; import jalview.datamodel.SequenceDummy; import jalview.datamodel.SequenceFeature; import jalview.datamodel.SequenceI; import jalview.io.gff.SequenceOntologyFactory; import jalview.io.gff.SequenceOntologyLite; import jalview.util.MapList; import java.util.List; import org.testng.annotations.Test; public class EnsemblCdnaTest { /** * Test that the cdna part of genomic sequence is correctly identified by * 'exon' features (or subtypes) - reverse strand case. */ @Test(groups = "Functional") public void getGenomicRangesFromFeatures_reverseStrand() { EnsemblCdna testee = new EnsemblCdna(); SequenceI genomic = new SequenceDummy("chr7"); genomic.setStart(10000); genomic.setEnd(50000); String transcriptId = "ABC123"; // exon at (start+10000) length 501 SequenceFeature sf = new SequenceFeature("exon", "", 20000, 20500, 0f, null); sf.setValue("Parent", "transcript:" + transcriptId); sf.setStrand("-"); genomic.addSequenceFeature(sf); // exon (sub-type) at (start + exon_variant) length 101 sf = new SequenceFeature("coding_exon", "", 10500, 10600, 0f, null); sf.setValue("Parent", "transcript:" + transcriptId); sf.setStrand("-"); genomic.addSequenceFeature(sf); // exon belonging to a different transcript doesn't count sf = new SequenceFeature("exon", "", 11500, 12600, 0f, null); sf.setValue("Parent", "transcript:anotherOne"); genomic.addSequenceFeature(sf); // transcript feature doesn't count sf = new SequenceFeature("transcript", "", 10000, 50000, 0f, null); genomic.addSequenceFeature(sf); SequenceOntologyFactory.setInstance(new SequenceOntologyLite()); MapList ranges = testee.getGenomicRangesFromFeatures(genomic, transcriptId, 23); List fromRanges = ranges.getFromRanges(); assertEquals(2, fromRanges.size()); /* * from ranges should be sorted by start order descending * and hold mappings from reverse strand sense */ assertEquals(20500, fromRanges.get(0)[0]); assertEquals(20000, fromRanges.get(0)[1]); assertEquals(10600, fromRanges.get(1)[0]); assertEquals(10500, fromRanges.get(1)[1]); // to range should start from given start numbering List toRanges = ranges.getToRanges(); assertEquals(1, toRanges.size()); assertEquals(23, toRanges.get(0)[0]); assertEquals(624, toRanges.get(0)[1]); } /** * Test that the cdna part of genomic sequence is correctly identified by * 'exon' features (or subtypes). */ @Test(groups = "Functional") public void getGenomicRangesFromFeatures() { EnsemblCdna testee = new EnsemblCdna(); SequenceI genomic = new SequenceDummy("chr7"); genomic.setStart(10000); genomic.setEnd(50000); String transcriptId = "ABC123"; // exon at (start+10000) length 501 SequenceFeature sf = new SequenceFeature("exon", "", 20000, 20500, 0f, null); sf.setValue("Parent", "transcript:" + transcriptId); sf.setStrand("+"); genomic.addSequenceFeature(sf); // exon (sub-type) at (start + exon_variant) length 101 sf = new SequenceFeature("coding_exon", "", 10500, 10600, 0f, null); sf.setValue("Parent", "transcript:" + transcriptId); sf.setStrand("+"); genomic.addSequenceFeature(sf); // exon belonging to a different transcript doesn't count sf = new SequenceFeature("exon", "", 11500, 12600, 0f, null); sf.setValue("Parent", "transcript:anotherOne"); genomic.addSequenceFeature(sf); // transcript feature doesn't count sf = new SequenceFeature("transcript", "", 10000, 50000, 0f, null); sf.setStrand("-"); // weird but ignored genomic.addSequenceFeature(sf); SequenceOntologyFactory.setInstance(new SequenceOntologyLite()); MapList ranges = testee.getGenomicRangesFromFeatures(genomic, transcriptId, 23); List fromRanges = ranges.getFromRanges(); assertEquals(2, fromRanges.size()); // from ranges should be sorted by start order assertEquals(10500, fromRanges.get(0)[0]); assertEquals(10600, fromRanges.get(0)[1]); assertEquals(20000, fromRanges.get(1)[0]); assertEquals(20500, fromRanges.get(1)[1]); // to range should start from given start numbering List toRanges = ranges.getToRanges(); assertEquals(1, toRanges.size()); assertEquals(23, toRanges.get(0)[0]); assertEquals(624, toRanges.get(0)[1]); } /** * The method under test should give up and return null if both forward and * reverse strands are present in the features of interest */ @Test(groups = "Functional") public void getGenomicRangesFromFeatures_mixedStrand() { EnsemblCdna testee = new EnsemblCdna(); SequenceI genomic = new SequenceDummy("chr7"); genomic.setStart(10000); genomic.setEnd(50000); String transcriptId = "ABC123"; SequenceFeature sf = new SequenceFeature("exon", "", 20000, 20500, 0f, null); sf.setValue("Parent", "transcript:" + transcriptId); sf.setStrand("-"); genomic.addSequenceFeature(sf); sf = new SequenceFeature("coding_exon", "", 10500, 10600, 0f, null); sf.setValue("Parent", "transcript:" + transcriptId); sf.setStrand("+"); genomic.addSequenceFeature(sf); SequenceOntologyFactory.setInstance(new SequenceOntologyLite()); MapList ranges = testee.getGenomicRangesFromFeatures(genomic, transcriptId, 23); assertNull(ranges); } }