2 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
3 * Copyright (C) $$Year-Rel$$ The Jalview Authors
5 * This file is part of Jalview.
7 * Jalview is free software: you can redistribute it and/or
8 * modify it under the terms of the GNU General Public License
9 * as published by the Free Software Foundation, either version 3
10 * of the License, or (at your option) any later version.
12 * Jalview is distributed in the hope that it will be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty
14 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
15 * PURPOSE. See the GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
19 * The Jalview Authors are detailed in the 'AUTHORS' file.
23 import jalview.datamodel.Sequence;
24 import jalview.datamodel.SequenceI;
26 import java.io.IOException;
27 import java.util.Vector;
29 public class PIRFile extends AlignFile
31 public static boolean useModellerOutput = false;
33 Vector words = new Vector(); // Stores the words in a line after splitting
39 public PIRFile(String inFile, DataSourceType sourceType)
42 super(inFile, sourceType);
45 public PIRFile(FileParse source) throws IOException
51 public void parse() throws IOException
53 StringBuffer sequence;
55 ModellerDescription md;
57 while ((line = nextLine()) != null)
59 if (line.length() == 0)
61 // System.out.println("blank line");
64 if (line.indexOf("C;") == 0 || line.indexOf("#") == 0)
68 Sequence newSeq = parseId(line.substring(line.indexOf(";") + 1));
70 sequence = new StringBuffer();
72 newSeq.setDescription(nextLine()); // this is the title line
74 boolean starFound = false;
79 sequence.append(line);
86 if (line.indexOf("*") > -1)
92 if (sequence.length() > 0)
94 sequence.setLength(sequence.length() - 1);
95 newSeq.setSequence(sequence.toString());
97 seqs.addElement(newSeq);
99 md = new ModellerDescription(newSeq.getDescription());
100 md.updateSequenceI(newSeq);
106 public String print()
108 return print(getSeqsAsArray());
111 public String print(SequenceI[] s)
113 boolean is_NA = jalview.util.Comparison.isNucleotide(s);
115 StringBuffer out = new StringBuffer();
117 ModellerDescription md;
119 while ((i < s.length) && (s[i] != null))
121 String seq = s[i].getSequenceAsString();
126 // modeller doesn't really do nucleotides, so we don't do anything fancy
127 // Official tags area as follows, for now we'll use P1 and DL
128 // Protein (complete) P1
129 // Protein (fragment) F1
135 // other functional RNA N1
137 out.append(">N1;" + s[i].getName());
139 if (s[i].getDescription() == null)
141 out.append(s[i].getName() + " "
142 + (s[i].getEnd() - s[i].getStart() + 1));
143 out.append(is_NA ? " bases" : " residues");
148 out.append(s[i].getDescription());
155 if (useModellerOutput)
157 out.append(">P1;" + s[i].getName());
159 md = new ModellerDescription(s[i]);
160 out.append(md.getDescriptionLine());
165 out.append(">P1;" + printId(s[i]));
167 if (s[i].getDescription() != null)
169 out.append(s[i].getDescription());
174 out.append(s[i].getName() + " "
175 + (s[i].getEnd() - s[i].getStart() + 1) + " residues");
180 int nochunks = (seq.length() / len)
181 + (seq.length() % len > 0 ? 1 : 0);
183 for (int j = 0; j < nochunks; j++)
186 int end = start + len;
188 if (end < seq.length())
190 out.append(seq.substring(start, end));
193 else if (start < seq.length())
195 out.append(seq.substring(start));
203 return out.toString();