/*
- * Jalview - A Sequence Alignment Editor and Viewer
- * Copyright (C) 2007 AM Waterhouse, J Procter, G Barton, M Clamp, S Searle
- *
- * This program is free software; you can redistribute it and/or
- * modify it under the terms of the GNU General Public License
- * as published by the Free Software Foundation; either version 2
+ * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
+ * Copyright (C) $$Year-Rel$$ The Jalview Authors
+ *
+ * This file is part of Jalview.
+ *
+ * Jalview is free software: you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation, either version 3
* of the License, or (at your option) any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU General Public License for more details.
- *
+ *
+ * Jalview is distributed in the hope that it will be useful, but
+ * WITHOUT ANY WARRANTY; without even the implied warranty
+ * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
+ * PURPOSE. See the GNU General Public License for more details.
+ *
* You should have received a copy of the GNU General Public License
- * along with this program; if not, write to the Free Software
- * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
+ * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
+ * The Jalview Authors are detailed in the 'AUTHORS' file.
*/
package jalview.io;
-import java.io.*;
-import java.util.*;
+import jalview.datamodel.AlignmentAnnotation;
+import jalview.datamodel.AlignmentI;
+import jalview.datamodel.Sequence;
+import jalview.datamodel.SequenceGroup;
+import jalview.datamodel.SequenceI;
+import jalview.util.MessageManager;
-import jalview.datamodel.*;
+import java.io.IOException;
+import java.util.ArrayList;
+import java.util.Enumeration;
+import java.util.Hashtable;
+import java.util.List;
+import java.util.Vector;
/**
* DOCUMENT ME!
- *
+ *
* @author $author$
* @version $Revision$
*/
-public abstract class AlignFile
- extends FileParse
+public abstract class AlignFile extends FileParse implements AlignmentFileI
{
int noSeqs = 0;
+
int maxLength = 0;
+
/**
- * Sequences to be added to form a new alignment.
+ * Sequences to be added to form a new alignment. TODO: remove vector in this
+ * class
*/
- protected Vector seqs;
+ protected Vector<SequenceI> seqs;
+
/**
* annotation to be added to generated alignment object
*/
- protected Vector annotations;
+ protected Vector<AlignmentAnnotation> annotations;
+
+ /**
+ * SequenceGroups to be added to the alignment object
+ */
+ protected List<SequenceGroup> seqGroups;
+
/**
* Properties to be added to generated alignment object
*/
- protected Hashtable properties;
+ private Hashtable properties;
+
long start;
+
long end;
- boolean jvSuffix = true;
+
+ private boolean parseCalled;
/**
* Creates a new AlignFile object.
*/
public AlignFile()
{
+ // Shouldn't we init data structures (JBPNote: not sure - initData is for
+ // initialising the structures used for reading from a datasource, and the
+ // bare constructor hasn't got any datasource)
+ initData();
+ }
+
+ public AlignFile(SequenceI[] seqs)
+ {
+ this();
+ setSeqs(seqs);
}
/**
* Constructor which parses the data from a file of some specified type.
- * @param inFile Filename to read from.
- * @param type What type of file to read from (File, URL)
+ *
+ * @param dataObject
+ * Filename, URL or Pasted String to read from.
+ * @param sourceType
+ * What type of file to read from (File, URL, Pasted String)
+ */
+ public AlignFile(String dataObject, DataSourceType sourceType)
+ throws IOException
+ {
+ this(true, dataObject, sourceType);
+ }
+
+ /**
+ * Constructor which (optionally delays) parsing of data from a file of some
+ * specified type.
+ *
+ * @param parseImmediately
+ * if false, need to call 'doParse()' to begin parsing data
+ * @param dataObject
+ * Filename, URL or Pasted String to read from.
+ * @param sourceType
+ * What type of file to read from (File, URL)
+ * @throws IOException
+ */
+ public AlignFile(boolean parseImmediately, String dataObject,
+ DataSourceType sourceType)
+ throws IOException
+ {
+ super(dataObject, sourceType);
+ initData();
+ if (parseImmediately)
+ {
+ doParse();
+ }
+ }
+
+ /**
+ * Attempt to read from the position where some other parsing process left
+ * off.
+ *
+ * @param source
+ * @throws IOException
*/
- public AlignFile(String inFile, String type)
- throws IOException
+ public AlignFile(FileParse source) throws IOException
{
- super(inFile, type);
+ this(true, source);
+ }
+ /**
+ * Construct a new parser to read from the position where some other parsing
+ * process left
+ *
+ * @param parseImmediately
+ * if false, need to call 'doParse()' to begin parsing data
+ * @param source
+ */
+ public AlignFile(boolean parseImmediately, FileParse source)
+ throws IOException
+ {
+ super(source);
initData();
+ if (parseImmediately)
+ {
+ doParse();
+ }
+ }
+ /**
+ * called if parsing was delayed till after parser was constructed
+ *
+ * @throws IOException
+ */
+ public void doParse() throws IOException
+ {
+ if (parseCalled)
+ {
+ throw new IOException(
+ "Implementation error: Parser called twice for same data.\n"
+ + "Need to call initData() again before parsing can be reattempted.");
+ }
+ parseCalled = true;
parse();
+ // sets the index of each sequence in the alignment
+ for (int i = 0, c = seqs.size(); i < c; i++)
+ {
+ seqs.get(i).setIndex(i);
+ }
}
/**
* Return the seqs Vector
*/
- public Vector getSeqs()
+ public Vector<SequenceI> getSeqs()
{
return seqs;
}
+ public List<SequenceGroup> getSeqGroups()
+ {
+ return seqGroups;
+ }
+
/**
* Return the Sequences in the seqs Vector as an array of Sequences
*/
+ @Override
public SequenceI[] getSeqsAsArray()
{
SequenceI[] s = new SequenceI[seqs.size()];
for (int i = 0; i < seqs.size(); i++)
{
- s[i] = (SequenceI) seqs.elementAt(i);
+ s[i] = seqs.elementAt(i);
}
return s;
}
+
/**
- * called by AppletFormatAdapter to generate
- * an annotated alignment, rather than bare
- * sequences.
+ * called by AppletFormatAdapter to generate an annotated alignment, rather
+ * than bare sequences.
+ *
* @param al
*/
- public void addAnnotations(Alignment al)
+ @Override
+ public void addAnnotations(AlignmentI al)
{
addProperties(al);
for (int i = 0; i < annotations.size(); i++)
{
- al.addAnnotation(
- (AlignmentAnnotation) annotations.elementAt(i)
- );
+ // detect if annotations.elementAt(i) rna secondary structure
+ // if so then do:
+ /*
+ * SequenceFeature[] pairArray =
+ * Rna.GetBasePairsFromAlignmentAnnotation(annotations.elementAt(i));
+ * Rna.HelixMap(pairArray);
+ */
+ AlignmentAnnotation an = annotations.elementAt(i);
+ an.validateRangeAndDisplay();
+ al.addAnnotation(an);
}
}
+
/**
- * Add any additional information extracted
- * from the file to the alignment properties.
+ * register sequence groups on the alignment for **output**
+ *
+ * @param al
+ */
+ public void addSeqGroups(AlignmentI al)
+ {
+ this.seqGroups = al.getGroups();
+
+ }
+
+ /**
+ * Add any additional information extracted from the file to the alignment
+ * properties.
+ *
* @note implicitly called by addAnnotations()
* @param al
*/
- public void addProperties(Alignment al)
+ public void addProperties(AlignmentI al)
{
- if (properties!=null && properties.size()>0)
+ if (properties != null && properties.size() > 0)
{
Enumeration keys = properties.keys();
Enumeration vals = properties.elements();
}
}
}
+
/**
- * Store a non-null key-value pair in a hashtable used to set alignment properties
- * note: null keys will raise an error, null values will result in the key/value pair being silently ignored.
- * @param key - non-null key object
- * @param value - non-null value
+ * Store a non-null key-value pair in a hashtable used to set alignment
+ * properties note: null keys will raise an error, null values will result in
+ * the key/value pair being silently ignored.
+ *
+ * @param key
+ * - non-null key object
+ * @param value
+ * - non-null value
*/
protected void setAlignmentProperty(Object key, Object value)
{
- if (key==null)
+ if (key == null)
{
- throw new Error("Implementation error: Cannot have null alignment property key.");
+ throw new Error(
+ MessageManager
+ .getString("error.implementation_error_cannot_have_null_alignment"));
}
- if (value==null)
+ if (value == null)
{
return; // null properties are ignored.
}
- if (properties==null)
+ if (properties == null)
{
properties = new Hashtable();
}
properties.put(key, value);
}
+
protected Object getAlignmentProperty(Object key)
{
- if (properties!=null && key!=null)
+ if (properties != null && key != null)
{
return properties.get(key);
}
return null;
}
+
/**
* Initialise objects to store sequence data in.
*/
protected void initData()
{
- seqs = new Vector();
- annotations = new Vector();
+ seqs = new Vector<SequenceI>();
+ annotations = new Vector<AlignmentAnnotation>();
+ seqGroups = new ArrayList<SequenceGroup>();
+ parseCalled = false;
}
/**
* DOCUMENT ME!
- *
- * @param s DOCUMENT ME!
+ *
+ * @param s
+ * DOCUMENT ME!
*/
- protected void setSeqs(SequenceI[] s)
+ @Override
+ public void setSeqs(SequenceI[] s)
{
- seqs = new Vector();
+ seqs = new Vector<SequenceI>();
for (int i = 0; i < s.length; i++)
{
/**
* This method must be implemented to parse the contents of the file.
*/
- public abstract void parse()
- throws IOException;
-
- /**
- * Print out in alignment file format the Sequences in the seqs Vector.
- */
- public abstract String print();
-
- public void addJVSuffix(boolean b)
- {
- jvSuffix = b;
- }
+ public abstract void parse() throws IOException;
/**
* A general parser for ids.
- *
+ *
* @String id Id to be parsed
*/
Sequence parseId(String id)
if (space > -1)
{
seq = new Sequence(id.substring(0, space), "");
- seq.setDescription(id.substring(space + 1));
+ String desc = id.substring(space + 1);
+ seq.setDescription(desc);
+
+ /*
+ * it is tempting to parse Ensembl style gene description e.g.
+ * chromosome:GRCh38:7:140696688:140721955:1 and set the
+ * start position of the sequence, but this causes much confusion
+ * for reverse strand feature locations
+ */
}
else
{
}
/**
- * Creates the output id.
- * Adds prefix Uniprot format source|id
- * And suffix Jalview /start-end
- *
+ * Creates the output id. Adds prefix Uniprot format source|id and optionally
+ * suffix Jalview /start-end
+ *
+ * @param jvsuffix
+ *
* @String id Id to be parsed
*/
+ String printId(SequenceI seq, boolean jvsuffix)
+ {
+ return seq.getDisplayId(jvsuffix);
+ }
+
String printId(SequenceI seq)
{
- return seq.getDisplayId(jvSuffix);
+ return printId(seq, true);
}
+
/**
- * vector of String[] treeName, newickString pairs
+ * vector of String[] treeName, newickString pairs
*/
- Vector newickStrings=null;
-
+ Vector<String[]> newickStrings = null;
+
protected void addNewickTree(String treeName, String newickString)
{
if (newickStrings == null)
{
- newickStrings = new Vector();
+ newickStrings = new Vector<String[]>();
}
- newickStrings.add(new String[] { treeName, newickString});
+ newickStrings.addElement(new String[] { treeName, newickString });
}
protected int getTreeCount()
{
- if (newickStrings==null)
+ return newickStrings == null ? 0 : newickStrings.size();
+ }
+
+ @Override
+ public void addGroups(AlignmentI al)
+ {
+
+ for (SequenceGroup sg : getSeqGroups())
{
- return 0;
+ al.addGroup(sg);
}
- return newickStrings.size();
}
}