X-Git-Url: http://source.jalview.org/gitweb/?a=blobdiff_plain;f=src%2Fjalview%2Fio%2FPIRFile.java;h=b958456265cb655472c75d783329a3ab2a07887f;hb=4891120c866fcd3516b270915d0db2d31a4815e0;hp=724fea8016240612bc28241d53653f4b95a6c0be;hpb=69f23b44e8ce05b33fca23ffb3774c285a23dd9b;p=jalview.git diff --git a/src/jalview/io/PIRFile.java b/src/jalview/io/PIRFile.java index 724fea8..b958456 100755 --- a/src/jalview/io/PIRFile.java +++ b/src/jalview/io/PIRFile.java @@ -21,12 +21,13 @@ package jalview.io; import java.io.*; import java.util.*; -import jalview.analysis.*; import jalview.datamodel.*; public class PIRFile extends AlignFile { + public static boolean useModellerOutput = false; + Vector words = new Vector(); //Stores the words in a line after splitting public PIRFile() @@ -44,12 +45,11 @@ public class PIRFile super(inFile, type); } - public void parse() + public void parse() throws IOException { - try - { StringBuffer sequence; String line = null; + ModellerDescription md; while ( (line = nextLine()) != null) { @@ -88,17 +88,20 @@ public class PIRFile { sequence.setLength(sequence.length() - 1); newSeq.setSequence(sequence.toString()); + if (!isValidProteinSequence(newSeq.getSequence())) + { + throw new IOException(AppletFormatAdapter.INVALID_CHARACTERS + +" : "+ newSeq.getName() + +" : "+invalidCharacter); + } + seqs.addElement(newSeq); - ModellerDescription md = new ModellerDescription(newSeq. - getDescription()); + + md = new ModellerDescription(newSeq. + getDescription()); md.updateSequenceI(newSeq); } } - } - catch (Exception ex) - { - ex.printStackTrace(); - } } public String print() @@ -112,17 +115,28 @@ public class PIRFile int len = 72; StringBuffer out = new StringBuffer(); int i = 0; + ModellerDescription md; while ( (i < s.length) && (s[i] != null)) { String seq = s[i].getSequence(); seq = seq + "*"; + if (is_NA) { - // modeller doesn't really do nucleotides, so we don't do anything fancy - // Nucleotide sequence tags should have a >DL; prefix - out.append(">P1;" + s[i].getName() + "\n"); // JBPNote Should change >P to >N + // modeller doesn't really do nucleotides, so we don't do anything fancy + // Official tags area as follows, for now we'll use P1 and DL + // Protein (complete) P1 + // Protein (fragment) F1 + // DNA (linear) Dl + // DNA (circular) DC + // RNA (linear) RL + // RNA (circular) RC + // tRNA N3 + // other functional RNA N1 + + out.append(">N1;" + s[i].getName() + "\n"); if (s[i].getDescription() == null) { out.append(s[i].getName() + " " + @@ -136,9 +150,23 @@ public class PIRFile } else { - out.append(">P1;" + s[i].getName() + "\n"); - ModellerDescription md = new ModellerDescription(s[i]); - out.append(md.getDescriptionLine() + "\n"); + + if(useModellerOutput) + { + out.append(">P1;" + s[i].getName() + "\n"); + md = new ModellerDescription(s[i]); + out.append(md.getDescriptionLine() + "\n"); + } + else + { + out.append(">P1;" + printId(s[i]) + "\n"); + if (s[i].getDescription() != null) + out.append(s[i].getDescription() + "\n"); + else + out.append(s[i].getName() + " " + + (s[i].getEnd() - s[i].getStart() + 1) + + " residues\n"); + } } int nochunks = (seq.length() / len) + 1;