-/*\r
-* Jalview - A Sequence Alignment Editor and Viewer\r
-* Copyright (C) 2006 AM Waterhouse, J Procter, G Barton, M Clamp, S Searle\r
-*\r
-* This program is free software; you can redistribute it and/or\r
-* modify it under the terms of the GNU General Public License\r
-* as published by the Free Software Foundation; either version 2\r
-* of the License, or (at your option) any later version.\r
-*\r
-* This program is distributed in the hope that it will be useful,\r
-* but WITHOUT ANY WARRANTY; without even the implied warranty of\r
-* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the\r
-* GNU General Public License for more details.\r
-*\r
-* You should have received a copy of the GNU General Public License\r
-* along with this program; if not, write to the Free Software\r
-* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA\r
-*/\r
-package jalview.io;\r
-\r
-import jalview.datamodel.*;\r
-\r
-import java.io.*;\r
-\r
-import java.util.*;\r
-\r
-\r
-/**\r
- * DOCUMENT ME!\r
- *\r
- * @author $author$\r
- * @version $Revision$\r
- */\r
-public abstract class AlignFile extends FileParse\r
-{\r
- int noSeqs = 0;\r
- int maxLength = 0;\r
- Vector seqs;\r
- Vector annotations;\r
- long start;\r
- long end;\r
- boolean jvSuffix = true;\r
-\r
- /**\r
- * Creates a new AlignFile object.\r
- */\r
- public AlignFile()\r
- {\r
- }\r
-\r
-\r
- /**\r
- * Constructor which parses the data from a file of some specified type.\r
- * @param inFile Filename to read from.\r
- * @param type What type of file to read from (File, URL)\r
- */\r
- public AlignFile(String inFile, String type) throws IOException\r
- {\r
- super(inFile, type);\r
-\r
- initData();\r
-\r
- parse();\r
- }\r
-\r
- /**\r
- * Return the seqs Vector\r
- */\r
- public Vector getSeqs()\r
- {\r
- return seqs;\r
- }\r
-\r
- /**\r
- * Return the Sequences in the seqs Vector as an array of Sequences\r
- */\r
- public SequenceI[] getSeqsAsArray()\r
- {\r
- SequenceI[] s = new SequenceI[seqs.size()];\r
-\r
- for (int i = 0; i < seqs.size(); i++)\r
- {\r
- s[i] = (SequenceI) seqs.elementAt(i);\r
- }\r
-\r
- return s;\r
- }\r
-\r
- public void addAnnotations(Alignment al)\r
- {\r
- for(int i=0; i<annotations.size(); i++)\r
- {\r
- al.addAnnotation(\r
- (AlignmentAnnotation)annotations.elementAt(i)\r
- );\r
- }\r
-\r
- }\r
-\r
- /**\r
- * Initialise objects to store sequence data in.\r
- */\r
- protected void initData()\r
- {\r
- seqs = new Vector();\r
- annotations = new Vector();\r
- }\r
-\r
- /**\r
- * DOCUMENT ME!\r
- *\r
- * @param s DOCUMENT ME!\r
- */\r
- protected void setSeqs(SequenceI[] s)\r
- {\r
- seqs = new Vector();\r
-\r
- for (int i = 0; i < s.length; i++)\r
- {\r
- seqs.addElement(s[i]);\r
- }\r
- }\r
-\r
- // Checks whether sequence is valid aa characters\r
- protected boolean isValidProteinSequence(char [] sequence)\r
- {\r
- for (int i = 0; i < sequence.length; i++)\r
- if (jalview.schemes.ResidueProperties.aaIndex[sequence[i]]==-1)\r
- {\r
- invalidCharacter = sequence[i];\r
- return false;\r
- }\r
-\r
- return true;\r
- }\r
-\r
- char invalidCharacter;\r
-\r
- /**\r
- * This method must be implemented to parse the contents of the file.\r
- */\r
- public abstract void parse() throws IOException;\r
-\r
- /**\r
- * Print out in alignment file format the Sequences in the seqs Vector.\r
- */\r
- public abstract String print();\r
-\r
- public void addJVSuffix(boolean b)\r
- {\r
- jvSuffix = b;\r
- }\r
-\r
- /**\r
- * A general parser for ids.\r
- *\r
- * @String id Id to be parsed\r
- */\r
- Sequence parseId(String id)\r
- {\r
- Sequence seq = null;\r
- id = id.trim();\r
- int space = id.indexOf(" ");\r
- if(space>-1)\r
- {\r
- seq = new Sequence(id.substring(0, space),"");\r
- seq.setDescription(id.substring(space+1));\r
- }\r
- else\r
- {\r
- seq = new Sequence(id, "");\r
- }\r
-\r
- return seq;\r
- }\r
-\r
- /**\r
- * Creates the output id.\r
- * Adds prefix Uniprot format source|id\r
- * And suffix Jalview /start-end\r
- *\r
- * @String id Id to be parsed\r
- */\r
- String printId(SequenceI seq)\r
- {\r
- return seq.getDisplayId(jvSuffix);\r
- }\r
-\r
-}\r
+/*
+ * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
+ * Copyright (C) $$Year-Rel$$ The Jalview Authors
+ *
+ * This file is part of Jalview.
+ *
+ * Jalview is free software: you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation, either version 3
+ * of the License, or (at your option) any later version.
+ *
+ * Jalview is distributed in the hope that it will be useful, but
+ * WITHOUT ANY WARRANTY; without even the implied warranty
+ * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
+ * PURPOSE. See the GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
+ * The Jalview Authors are detailed in the 'AUTHORS' file.
+ */
+package jalview.io;
+
+import jalview.datamodel.AlignmentAnnotation;
+import jalview.datamodel.AlignmentI;
+import jalview.datamodel.Sequence;
+import jalview.datamodel.SequenceGroup;
+import jalview.datamodel.SequenceI;
+import jalview.util.MessageManager;
+
+import java.io.IOException;
+import java.util.ArrayList;
+import java.util.Enumeration;
+import java.util.Hashtable;
+import java.util.List;
+import java.util.Vector;
+
+/**
+ * DOCUMENT ME!
+ *
+ * @author $author$
+ * @version $Revision$
+ */
+public abstract class AlignFile extends FileParse
+ implements AlignmentFileReaderI, AlignmentFileWriterI
+{
+ int noSeqs = 0;
+
+ int maxLength = 0;
+
+ /**
+ * Sequences to be added to form a new alignment. TODO: remove vector in this
+ * class
+ */
+ protected Vector<SequenceI> seqs;
+
+ /**
+ * annotation to be added to generated alignment object
+ */
+ protected Vector<AlignmentAnnotation> annotations;
+
+ /**
+ * SequenceGroups to be added to the alignment object
+ */
+ protected List<SequenceGroup> seqGroups;
+
+ /**
+ * Properties to be added to generated alignment object
+ */
+ private Hashtable properties;
+
+ long start;
+
+ long end;
+
+ /**
+ * true if parse() has been called
+ */
+ private boolean parseCalled = false;
+
+ private boolean parseImmediately = true;
+
+ /**
+ * @return if doParse() was called at construction time
+ */
+ protected boolean isParseImmediately()
+ {
+ return parseImmediately;
+ }
+
+ /**
+ * Creates a new AlignFile object.
+ */
+ public AlignFile()
+ {
+ // Shouldn't we init data structures (JBPNote: not sure - initData is for
+ // initialising the structures used for reading from a datasource, and the
+ // bare constructor hasn't got any datasource)
+ initData();
+ }
+
+ public AlignFile(SequenceI[] seqs)
+ {
+ this();
+ setSeqs(seqs);
+ }
+
+ /**
+ * Constructor which parses the data from a file of some specified type.
+ *
+ * @param dataObject
+ * Filename, URL or Pasted String to read from.
+ * @param sourceType
+ * What type of file to read from (File, URL, Pasted String)
+ */
+ public AlignFile(String dataObject, DataSourceType sourceType)
+ throws IOException
+ {
+ this(true, dataObject, sourceType);
+ }
+
+ /**
+ * Constructor which (optionally delays) parsing of data from a file of some
+ * specified type.
+ *
+ * @param parseImmediately
+ * if false, need to call 'doParse()' to begin parsing data
+ * @param dataObject
+ * Filename, URL or Pasted String to read from.
+ * @param sourceType
+ * What type of file to read from (File, URL)
+ * @throws IOException
+ */
+ public AlignFile(boolean parseImmediately, String dataObject,
+ DataSourceType sourceType) throws IOException
+ {
+ super(dataObject, sourceType);
+ initData();
+ if (parseImmediately)
+ {
+ doParse();
+ }
+ }
+
+ /**
+ * Attempt to read from the position where some other parsing process left
+ * off.
+ *
+ * @param source
+ * @throws IOException
+ */
+ public AlignFile(FileParse source) throws IOException
+ {
+ this(true, source);
+ }
+
+ /**
+ * Construct a new parser to read from the position where some other parsing
+ * process left
+ *
+ * @param parseImmediately
+ * if false, need to call 'doParse()' to begin parsing data
+ * @param source
+ */
+ public AlignFile(boolean parseImmediately, FileParse source)
+ throws IOException
+ {
+ super(source);
+ initData();
+
+ // stash flag in case parse needs to know if it has to autoconfigure or was
+ // configured after construction
+ this.parseImmediately = parseImmediately;
+
+ if (parseImmediately)
+ {
+ doParse();
+ }
+ }
+
+ /**
+ * called if parsing was delayed till after parser was constructed
+ *
+ * @throws IOException
+ */
+ public void doParse() throws IOException
+ {
+ if (parseCalled)
+ {
+ throw new IOException(
+ "Implementation error: Parser called twice for same data.\n"
+ + "Need to call initData() again before parsing can be reattempted.");
+ }
+ parseCalled = true;
+ parse();
+ }
+
+ /**
+ * Return the seqs Vector
+ */
+ public Vector<SequenceI> getSeqs()
+ {
+ return seqs;
+ }
+
+ public List<SequenceGroup> getSeqGroups()
+ {
+ return seqGroups;
+ }
+
+ /**
+ * Return the Sequences in the seqs Vector as an array of Sequences
+ */
+ @Override
+ public SequenceI[] getSeqsAsArray()
+ {
+ SequenceI[] s = new SequenceI[seqs.size()];
+
+ for (int i = 0; i < seqs.size(); i++)
+ {
+ s[i] = seqs.elementAt(i);
+ }
+
+ return s;
+ }
+
+ /**
+ * called by AppletFormatAdapter to generate an annotated alignment, rather
+ * than bare sequences.
+ *
+ * @param al
+ */
+ @Override
+ public void addAnnotations(AlignmentI al)
+ {
+ addProperties(al);
+ for (int i = 0; i < annotations.size(); i++)
+ {
+ // detect if annotations.elementAt(i) rna secondary structure
+ // if so then do:
+ /*
+ * SequenceFeature[] pairArray =
+ * Rna.GetBasePairsFromAlignmentAnnotation(annotations.elementAt(i));
+ * Rna.HelixMap(pairArray);
+ */
+ AlignmentAnnotation an = annotations.elementAt(i);
+ an.validateRangeAndDisplay();
+ al.addAnnotation(an);
+ }
+
+ }
+
+ /**
+ * register sequence groups on the alignment for **output**
+ *
+ * @param al
+ */
+ public void addSeqGroups(AlignmentI al)
+ {
+ this.seqGroups = al.getGroups();
+
+ }
+
+ /**
+ * Add any additional information extracted from the file to the alignment
+ * properties.
+ *
+ * @note implicitly called by addAnnotations()
+ * @param al
+ */
+ public void addProperties(AlignmentI al)
+ {
+ if (properties != null && properties.size() > 0)
+ {
+ Enumeration keys = properties.keys();
+ Enumeration vals = properties.elements();
+ while (keys.hasMoreElements())
+ {
+ al.setProperty(keys.nextElement(), vals.nextElement());
+ }
+ }
+ }
+
+ /**
+ * Store a non-null key-value pair in a hashtable used to set alignment
+ * properties note: null keys will raise an error, null values will result in
+ * the key/value pair being silently ignored.
+ *
+ * @param key
+ * - non-null key object
+ * @param value
+ * - non-null value
+ */
+ protected void setAlignmentProperty(Object key, Object value)
+ {
+ if (key == null)
+ {
+ throw new Error(MessageManager.getString(
+ "error.implementation_error_cannot_have_null_alignment"));
+ }
+ if (value == null)
+ {
+ return; // null properties are ignored.
+ }
+ if (properties == null)
+ {
+ properties = new Hashtable();
+ }
+ properties.put(key, value);
+ }
+
+ protected Object getAlignmentProperty(Object key)
+ {
+ if (properties != null && key != null)
+ {
+ return properties.get(key);
+ }
+ return null;
+ }
+
+ /**
+ * Initialise objects to store sequence data in.
+ */
+ protected void initData()
+ {
+ seqs = new Vector<>();
+ annotations = new Vector<>();
+ seqGroups = new ArrayList<>();
+ parseCalled = false;
+ }
+
+ /**
+ * DOCUMENT ME!
+ *
+ * @param s
+ * DOCUMENT ME!
+ */
+ @Override
+ public void setSeqs(SequenceI[] s)
+ {
+ seqs = new Vector<>();
+
+ for (int i = 0; i < s.length; i++)
+ {
+ seqs.addElement(s[i]);
+ }
+ }
+
+ /**
+ * This method must be implemented to parse the contents of the file.
+ */
+ public abstract void parse() throws IOException;
+
+ /**
+ * A general parser for ids.
+ *
+ * @String id Id to be parsed
+ */
+ Sequence parseId(String id)
+ {
+ Sequence seq = null;
+ id = id.trim();
+ int space = id.indexOf(" ");
+ if (space > -1)
+ {
+ seq = new Sequence(id.substring(0, space), "");
+ String desc = id.substring(space + 1);
+ seq.setDescription(desc);
+
+ /*
+ * it is tempting to parse Ensembl style gene description e.g.
+ * chromosome:GRCh38:7:140696688:140721955:1 and set the
+ * start position of the sequence, but this causes much confusion
+ * for reverse strand feature locations
+ */
+ }
+ else
+ {
+ seq = new Sequence(id, "");
+ }
+
+ return seq;
+ }
+
+ /**
+ * Creates the output id. Adds prefix Uniprot format source|id and optionally
+ * suffix Jalview /start-end
+ *
+ * @param jvsuffix
+ *
+ * @String id Id to be parsed
+ */
+ String printId(SequenceI seq, boolean jvsuffix)
+ {
+ return seq.getDisplayId(jvsuffix);
+ }
+
+ String printId(SequenceI seq)
+ {
+ return printId(seq, true);
+ }
+
+ /**
+ * vector of String[] treeName, newickString pairs
+ */
+ Vector<String[]> newickStrings = null;
+
+ protected void addNewickTree(String treeName, String newickString)
+ {
+ if (newickStrings == null)
+ {
+ newickStrings = new Vector<>();
+ }
+ newickStrings.addElement(new String[] { treeName, newickString });
+ }
+
+ protected int getTreeCount()
+ {
+ return newickStrings == null ? 0 : newickStrings.size();
+ }
+
+ @Override
+ public void addGroups(AlignmentI al)
+ {
+
+ for (SequenceGroup sg : getSeqGroups())
+ {
+ al.addGroup(sg);
+ }
+ }
+
+ protected void addSequence(SequenceI seq)
+ {
+ seqs.add(seq);
+ }
+
+ /**
+ * Used only for hmmer statistics, so should probably be removed at some
+ * point. TODO remove this
+ *
+ * @return
+ */
+ public Vector<AlignmentAnnotation> getAnnotations()
+ {
+ return annotations;
+ }
+
+}