X-Git-Url: http://source.jalview.org/gitweb/?a=blobdiff_plain;f=test%2Fjalview%2Fext%2Fensembl%2FEnsemblCdnaTest.java;h=9e9d9a422673456b7cb7e4bfe35c7810ace63501;hb=3c8a25936a2d805e7e3d7ab82f83b13135406d18;hp=30bc81ba709a740ee774214349dd9b892f2e0d52;hpb=e7a5ac489e89d1c97ba55c817015945ed208f495;p=jalview.git diff --git a/test/jalview/ext/ensembl/EnsemblCdnaTest.java b/test/jalview/ext/ensembl/EnsemblCdnaTest.java index 30bc81b..9e9d9a4 100644 --- a/test/jalview/ext/ensembl/EnsemblCdnaTest.java +++ b/test/jalview/ext/ensembl/EnsemblCdnaTest.java @@ -1,27 +1,74 @@ +/* + * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$) + * Copyright (C) $$Year-Rel$$ The Jalview Authors + * + * This file is part of Jalview. + * + * Jalview is free software: you can redistribute it and/or + * modify it under the terms of the GNU General Public License + * as published by the Free Software Foundation, either version 3 + * of the License, or (at your option) any later version. + * + * Jalview is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty + * of MERCHANTABILITY or FITNESS FOR A PARTICULAR + * PURPOSE. See the GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with Jalview. If not, see . + * The Jalview Authors are detailed in the 'AUTHORS' file. + */ package jalview.ext.ensembl; import static org.testng.AssertJUnit.assertEquals; +import static org.testng.AssertJUnit.assertFalse; import static org.testng.AssertJUnit.assertNull; +import static org.testng.AssertJUnit.assertTrue; +import jalview.datamodel.Sequence; import jalview.datamodel.SequenceDummy; import jalview.datamodel.SequenceFeature; import jalview.datamodel.SequenceI; +import jalview.gui.JvOptionPane; import jalview.io.gff.SequenceOntologyFactory; import jalview.io.gff.SequenceOntologyLite; import jalview.util.MapList; import java.util.List; +import org.testng.Assert; +import org.testng.annotations.AfterClass; +import org.testng.annotations.BeforeClass; import org.testng.annotations.Test; public class EnsemblCdnaTest { + + @BeforeClass(alwaysRun = true) + public void setUpJvOptionPane() + { + JvOptionPane.setInteractiveMode(false); + JvOptionPane.setMockResponse(JvOptionPane.CANCEL_OPTION); + } + + @BeforeClass(alwaysRun = true) + public void setUp() + { + SequenceOntologyFactory.setInstance(new SequenceOntologyLite()); + } + + @AfterClass(alwaysRun = true) + public void tearDown() + { + SequenceOntologyFactory.setInstance(null); + } + /** * Test that the cdna part of genomic sequence is correctly identified by * 'exon' features (or subtypes) - reverse strand case. */ @Test(groups = "Functional") - public void getGenomicRangesFromFeatures_reverseStrand() + public void testGetGenomicRangesFromFeatures_reverseStrand() { EnsemblCdna testee = new EnsemblCdna(); SequenceI genomic = new SequenceDummy("chr7"); @@ -32,27 +79,25 @@ public class EnsemblCdnaTest // exon at (start+10000) length 501 SequenceFeature sf = new SequenceFeature("exon", "", 20000, 20500, 0f, null); - sf.setValue("Parent", "transcript:" + transcriptId); + sf.setValue("Parent", transcriptId); sf.setStrand("-"); genomic.addSequenceFeature(sf); // exon (sub-type) at (start + exon_variant) length 101 sf = new SequenceFeature("coding_exon", "", 10500, 10600, 0f, null); - sf.setValue("Parent", "transcript:" + transcriptId); + sf.setValue("Parent", transcriptId); sf.setStrand("-"); genomic.addSequenceFeature(sf); // exon belonging to a different transcript doesn't count sf = new SequenceFeature("exon", "", 11500, 12600, 0f, null); - sf.setValue("Parent", "transcript:anotherOne"); + sf.setValue("Parent", "anotherOne"); genomic.addSequenceFeature(sf); // transcript feature doesn't count sf = new SequenceFeature("transcript", "", 10000, 50000, 0f, null); genomic.addSequenceFeature(sf); - SequenceOntologyFactory.setInstance(new SequenceOntologyLite()); - MapList ranges = testee.getGenomicRangesFromFeatures(genomic, transcriptId, 23); List fromRanges = ranges.getFromRanges(); @@ -75,42 +120,40 @@ public class EnsemblCdnaTest /** * Test that the cdna part of genomic sequence is correctly identified by - * 'exon' features (or subtypes). + * 'exon' features (or subtypes) with the desired transcript as parent */ @Test(groups = "Functional") - public void getGenomicRangesFromFeatures() + public void testGetGenomicRangesFromFeatures() { EnsemblCdna testee = new EnsemblCdna(); SequenceI genomic = new SequenceDummy("chr7"); genomic.setStart(10000); genomic.setEnd(50000); String transcriptId = "ABC123"; - + // exon at (start+10000) length 501 SequenceFeature sf = new SequenceFeature("exon", "", 20000, 20500, 0f, null); - sf.setValue("Parent", "transcript:" + transcriptId); + sf.setValue("Parent", transcriptId); sf.setStrand("+"); genomic.addSequenceFeature(sf); - + // exon (sub-type) at (start + exon_variant) length 101 sf = new SequenceFeature("coding_exon", "", 10500, 10600, 0f, null); - sf.setValue("Parent", "transcript:" + transcriptId); + sf.setValue("Parent", transcriptId); sf.setStrand("+"); genomic.addSequenceFeature(sf); - + // exon belonging to a different transcript doesn't count sf = new SequenceFeature("exon", "", 11500, 12600, 0f, null); - sf.setValue("Parent", "transcript:anotherOne"); + sf.setValue("Parent", "anotherOne"); genomic.addSequenceFeature(sf); - + // transcript feature doesn't count sf = new SequenceFeature("transcript", "", 10000, 50000, 0f, null); sf.setStrand("-"); // weird but ignored genomic.addSequenceFeature(sf); - - SequenceOntologyFactory.setInstance(new SequenceOntologyLite()); - + MapList ranges = testee.getGenomicRangesFromFeatures(genomic, transcriptId, 23); List fromRanges = ranges.getFromRanges(); @@ -132,29 +175,130 @@ public class EnsemblCdnaTest * reverse strands are present in the features of interest */ @Test(groups = "Functional") - public void getGenomicRangesFromFeatures_mixedStrand() + public void testGetGenomicRangesFromFeatures_mixedStrand() { EnsemblCdna testee = new EnsemblCdna(); SequenceI genomic = new SequenceDummy("chr7"); genomic.setStart(10000); genomic.setEnd(50000); String transcriptId = "ABC123"; - + SequenceFeature sf = new SequenceFeature("exon", "", 20000, 20500, 0f, null); sf.setValue("Parent", "transcript:" + transcriptId); sf.setStrand("-"); genomic.addSequenceFeature(sf); - + sf = new SequenceFeature("coding_exon", "", 10500, 10600, 0f, null); sf.setValue("Parent", "transcript:" + transcriptId); sf.setStrand("+"); genomic.addSequenceFeature(sf); - - SequenceOntologyFactory.setInstance(new SequenceOntologyLite()); - + MapList ranges = testee.getGenomicRangesFromFeatures(genomic, transcriptId, 23); assertNull(ranges); } + + /** + * Test the method that retains features except for 'transcript' (or + * subtypes), or features with parent other than the given id + */ + @Test(groups = "Functional") + public void testRetainFeature() + { + String accId = "ABC123"; + EnsemblCdna testee = new EnsemblCdna(); + + SequenceFeature sf = new SequenceFeature("transcript", "", 20000, + 20500, 0f, null); + assertFalse(testee.retainFeature(sf, accId)); + + sf = new SequenceFeature("aberrant_processed_transcript", "", 20000, + 20500, 0f, null); + assertFalse(testee.retainFeature(sf, accId)); + + sf = new SequenceFeature("NMD_transcript_variant", "", 20000, 20500, + 0f, null); + assertFalse(testee.retainFeature(sf, accId)); + + // other feature with no parent is retained + sf = new SequenceFeature("sequence_variant", "", 20000, 20500, 0f, null); + assertTrue(testee.retainFeature(sf, accId)); + + // other feature with desired parent is retained + sf.setValue("Parent", accId); + assertTrue(testee.retainFeature(sf, accId)); + + // test is not case-sensitive + assertTrue(testee.retainFeature(sf, accId.toLowerCase())); + + // feature with wrong parent is not retained + sf.setValue("Parent", "XYZ"); + assertFalse(testee.retainFeature(sf, accId)); + } + + /** + * Test the method that picks out 'exon' (or subtype) features with the + * accession id as parent + */ + @Test(groups = "Functional") + public void testGetIdentifyingFeatures() + { + String accId = "ABC123"; + SequenceI seq = new Sequence(accId, "MKLNFRQIE"); + + // exon with no parent: not valid + SequenceFeature sf1 = new SequenceFeature("exon", "", 1, 2, 0f, null); + seq.addSequenceFeature(sf1); + + // exon with wrong parent: not valid + SequenceFeature sf2 = new SequenceFeature("exon", "", 1, 2, 0f, null); + sf2.setValue("Parent", "XYZ"); + seq.addSequenceFeature(sf2); + + // exon with right parent is valid + SequenceFeature sf3 = new SequenceFeature("exon", "", 1, 2, 0f, null); + sf3.setValue("Parent", accId); + seq.addSequenceFeature(sf3); + + // exon sub-type with right parent is valid + SequenceFeature sf4 = new SequenceFeature("coding_exon", "", 1, 2, 0f, + null); + sf4.setValue("Parent", accId); + seq.addSequenceFeature(sf4); + + // transcript not valid: + SequenceFeature sf5 = new SequenceFeature("transcript", "", 1, 2, 0f, + null); + sf5.setValue("Parent", accId); + seq.addSequenceFeature(sf5); + + // CDS not valid: + SequenceFeature sf6 = new SequenceFeature("transcript", "", 1, 2, 0f, + null); + sf6.setValue("Parent", accId); + seq.addSequenceFeature(sf6); + + List sfs = new EnsemblCdna() + .getIdentifyingFeatures(seq, accId); + assertFalse(sfs.contains(sf1)); + assertFalse(sfs.contains(sf2)); + assertTrue(sfs.contains(sf3)); + assertTrue(sfs.contains(sf4)); + assertFalse(sfs.contains(sf5)); + assertFalse(sfs.contains(sf6)); + } + + @Test(groups = "Functional") + public void testIsValidReference() throws Exception + { + EnsemblSequenceFetcher esq = new EnsemblCdna(); + Assert.assertTrue(esq.isValidReference("CCDS5863.1")); + Assert.assertTrue(esq.isValidReference("ENST00000288602")); + Assert.assertTrue(esq.isValidReference("ENSG00000288602")); + Assert.assertFalse(esq.isValidReference("ENSP00000288602")); + Assert.assertFalse(esq.isValidReference("ENST0000288602")); + // non-human species having a 3 character identifier included: + Assert.assertTrue(esq.isValidReference("ENSMUSG00000099398")); + } }