X-Git-Url: http://source.jalview.org/gitweb/?a=blobdiff_plain;f=src%2Fjalview%2Fio%2FIdentifyFile.java;h=86036fde9cef0107ace8392e3f5e21444246b907;hb=a96d51f58325f8429c5792ae554243de5628d62a;hp=18e1a6a2a340e3f92476231bbc9197c721dce431;hpb=b5dceeaf4112cd63aa1642dd8851b3ec19a7c81e;p=jalview.git diff --git a/src/jalview/io/IdentifyFile.java b/src/jalview/io/IdentifyFile.java index 18e1a6a..86036fd 100755 --- a/src/jalview/io/IdentifyFile.java +++ b/src/jalview/io/IdentifyFile.java @@ -1,79 +1,221 @@ -/******************** - * 2004 Jalview Reengineered - * Barton Group - * Dundee University - * - * AM Waterhouse - *******************/ - -package jalview.io; - -import java.io.*; -import java.net.*; - -public class IdentifyFile -{ - public static String Identify(String file, String protocol) - { - String reply = "PFAM"; - try{ - - BufferedReader reader = null; - - if(protocol.equals("File")) - reader = new BufferedReader(new FileReader(file)); - - else if (protocol.equals("URL")) - { - reply = "URL NOT FOUND"; - URL url = new URL(file); - reader = new BufferedReader(new InputStreamReader( url.openStream() ) ); - reply = "error"; - } - else if( protocol.equals("Paste")) - reader = new BufferedReader( new StringReader(file) ); - - - String data; - while( (data=reader.readLine())!=null) - { - data = data.toUpperCase(); - if(data.indexOf("#")==0 || data.length()<1) - continue; - - if(data.indexOf("PILEUP")>-1) - { - reply = "MSF"; - break; - } - else if(data.indexOf("CLUSTAL")>-1) - { - reply = "CLUSTAL"; - break; - } - else if(data.indexOf(">P1;")>-1 || data.indexOf(">DL;")>-1) - { - reply = "PIR"; - break; - } - else if(data.indexOf(">")>-1) - { - // could be BLC file, read next line to confirm - data = reader.readLine(); - if(data.indexOf(">")>-1) - reply = "BLC"; - else - reply = "FASTA"; - - break; - } - } - reader.close(); - } - catch(Exception ex){ex.printStackTrace();} - - return reply; - } - - -} +/* + * Jalview - A Sequence Alignment Editor and Viewer + * Copyright (C) 2007 AM Waterhouse, J Procter, G Barton, M Clamp, S Searle + * + * This program is free software; you can redistribute it and/or + * modify it under the terms of the GNU General Public License + * as published by the Free Software Foundation; either version 2 + * of the License, or (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA + */ +package jalview.io; + +import java.io.*; +import java.net.*; + +/** + * DOCUMENT ME! + * + * @author $author$ + * @version $Revision$ + */ +public class IdentifyFile +{ + /** + * Identify a datasource's file content. + * @note Do not use this method + * for stream sources - create a FileParse object instead. + * + * @param file DOCUMENT ME! + * @param protocol DOCUMENT ME! + * @return ID String + */ + public String Identify(String file, String protocol) + { + FileParse parser = null; + try { + parser = new FileParse(file, protocol); + if (parser.isValid()) { + return Identify(parser); + } + } catch (Exception e) { + System.err.println("Error whilst identifying"); + e.printStackTrace(System.err); + } + if (parser!=null) + return parser.errormessage; + return "UNIDENTIFIED FILE PARSING ERROR"; + } + public String Identify(FileParse source) { + return Identify(source, true); // preserves original behaviour prior to version 2.3 + } + /** + * Identify contents of source, closing it or resetting source to start afterwards. + * @param source + * @param closeSource + * @return filetype string + */ + public String Identify(FileParse source, boolean closeSource) { + String reply = "PFAM"; + String data; + int length=0; + boolean lineswereskipped=false; + boolean isBinary = false; // true if length is non-zero and non-printable characters are encountered + try { + while ( (data = source.nextLine()) != null) + { + length+=data.length(); + if (!lineswereskipped) + { + for (int i=0;!isBinary && i-1 || fileStr.lastIndexOf(".zip")>-1) + { + reply = "Jalview"; + } + } + if (!lineswereskipped && data.startsWith("PK")) { + reply="Jalview"; // archive. + break; + } + } + data = data.toUpperCase(); + + if ( (data.indexOf("# STOCKHOLM") > -1)) + { + reply = "STH"; + + break; + } + + if ((data.length() < 1) || (data.indexOf("#") == 0)) + { + lineswereskipped=true; + continue; + } + + if (data.indexOf("PILEUP") > -1) + { + reply = "PileUp"; + + break; + } + + if ( (data.indexOf("//") == 0) || + ( (data.indexOf("!!") > -1) && + (data.indexOf("!!") < data.indexOf( + "_MULTIPLE_ALIGNMENT ")))) + { + reply = "MSF"; + + break; + } + else if (data.indexOf("CLUSTAL") > -1) + { + reply = "CLUSTAL"; + + break; + } + else if ( (data.indexOf(">P1;") > -1) || + (data.indexOf(">DL;") > -1)) + { + reply = "PIR"; + + break; + } + else if (data.indexOf(">") > -1) + { + // could be BLC file, read next line to confirm + data = source.nextLine(); + + if (data.indexOf(">") > -1) + { + reply = "BLC"; + } + else + { + //Is this a single line BLC file? + source.nextLine(); + String data2 = source.nextLine(); + if (data2 != null + && data.indexOf("*") > -1 + && data.indexOf("*") == data2.indexOf("*")) + { + reply = "BLC"; + } + else + { + reply = "FASTA"; + // TODO : AMSA File is indicated if there is annotation in the FASTA file - but FASTA will automatically generate this at the mo. + } + } + break; + } + else if (data.indexOf("HEADER") == 0 || + data.indexOf("ATOM") == 0) + { + reply = "PDB"; + break; + } + else if (!lineswereskipped + && data.charAt(0)!='*' + && data.charAt(0)!=' ' + && data.indexOf(":") < data.indexOf(",")) // && data.indexOf(",") [ ...]"); + } + } +}