X-Git-Url: http://source.jalview.org/gitweb/?a=blobdiff_plain;f=src%2Fjalview%2Fanalysis%2FAAFrequency.java;h=2c1a998a11424efa84f470ab46d8dc8e3ebecb07;hb=a8f483d04205bb8273ee311c12968b7e86d205fa;hp=d56fb01ec54b4a71f77db484e6b9e58bc370c5f9;hpb=bbfdb203ce3a889600caa52478478b75ab03809f;p=jalview.git diff --git a/src/jalview/analysis/AAFrequency.java b/src/jalview/analysis/AAFrequency.java index d56fb01..2c1a998 100755 --- a/src/jalview/analysis/AAFrequency.java +++ b/src/jalview/analysis/AAFrequency.java @@ -1,24 +1,26 @@ /* - * Jalview - A Sequence Alignment Editor and Viewer (Version 2.7) - * Copyright (C) 2011 J Procter, AM Waterhouse, J Engelhardt, LM Lui, G Barton, M Clamp, S Searle + * Jalview - A Sequence Alignment Editor and Viewer (Version 2.8.2) + * Copyright (C) 2014 The Jalview Authors * * This file is part of Jalview. * * Jalview is free software: you can redistribute it and/or * modify it under the terms of the GNU General Public License * as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. - * + * * Jalview is distributed in the hope that it will be useful, but * WITHOUT ANY WARRANTY; without even the implied warranty * of MERCHANTABILITY or FITNESS FOR A PARTICULAR * PURPOSE. See the GNU General Public License for more details. * * You should have received a copy of the GNU General Public License along with Jalview. If not, see . + * The Jalview Authors are detailed in the 'AUTHORS' file. */ package jalview.analysis; import java.util.*; +import jalview.util.Format; import jalview.datamodel.*; /** @@ -44,36 +46,38 @@ public class AAFrequency public static final String PROFILE = "P"; - public static final Hashtable[] calculate(Vector sequences, int start, - int end) + public static final Hashtable[] calculate(List list, + int start, int end) { - return calculate(sequences, start, end, false); + return calculate(list, start, end, false); } - public static final Hashtable[] calculate(Vector sequences, int start, - int end, boolean profile) + public static final Hashtable[] calculate(List sequences, + int start, int end, boolean profile) { SequenceI[] seqs = new SequenceI[sequences.size()]; int width = 0; - for (int i = 0; i < sequences.size(); i++) + synchronized (sequences) { - seqs[i] = (SequenceI) sequences.elementAt(i); - if (seqs[i].getLength() > width) + for (int i = 0; i < sequences.size(); i++) { - width = seqs[i].getLength(); + seqs[i] = sequences.get(i); + if (seqs[i].getLength() > width) + { + width = seqs[i].getLength(); + } } - } - Hashtable[] reply = new Hashtable[width]; - - if (end >= width) - { - end = width; - } + Hashtable[] reply = new Hashtable[width]; - calculate(seqs, start, end, reply, profile); + if (end >= width) + { + end = width; + } - return reply; + calculate(seqs, start, end, reply, profile); + return reply; + } } public static final void calculate(SequenceI[] sequences, int start, @@ -88,7 +92,7 @@ public class AAFrequency Hashtable residueHash; int maxCount, nongap, i, j, v, jSize = sequences.length; String maxResidue; - char c; + char c='-'; float percentage; int[] values = new int[255]; @@ -102,12 +106,13 @@ public class AAFrequency maxResidue = ""; nongap = 0; values = new int[255]; - + for (j = 0; j < jSize; j++) { - if (sequences[j]==null) + if (sequences[j] == null) { - System.err.println("WARNING: Consensus skipping null sequence - possible race condition."); + System.err + .println("WARNING: Consensus skipping null sequence - possible race condition."); continue; } seq = sequences[j].getSequence(); @@ -139,8 +144,11 @@ public class AAFrequency values['-']++; } } - - for (v = 'A'; v < 'Z'; v++) + if (jSize==1) + { + maxResidue = String.valueOf(c); + maxCount=1; + } else {for (v = 'A'; v < 'Z'; v++) { if (values[v] < 2 || values[v] < maxCount) { @@ -157,7 +165,7 @@ public class AAFrequency } maxCount = values[v]; } - + } if (maxResidue.length() == 0) { maxResidue = "-"; @@ -171,11 +179,15 @@ public class AAFrequency residueHash.put(MAXCOUNT, new Integer(maxCount)); residueHash.put(MAXRESIDUE, maxResidue); - percentage = ((float) maxCount * 100) / (float) jSize; + percentage = ((float) maxCount * 100) / jSize; residueHash.put(PID_GAPS, new Float(percentage)); - percentage = ((float) maxCount * 100) / (float) nongap; + if (nongap>0) { + // calculate for non-gapped too + percentage = ((float) maxCount * 100) / nongap; + } residueHash.put(PID_NOGAPS, new Float(percentage)); + result[i] = residueHash; } } @@ -191,14 +203,15 @@ public class AAFrequency * @param width * @param ignoreGapsInConsensusCalculation * @param includeAllConsSymbols + * @param nseq */ public static void completeConsensus(AlignmentAnnotation consensus, Hashtable[] hconsensus, int iStart, int width, boolean ignoreGapsInConsensusCalculation, - boolean includeAllConsSymbols) + boolean includeAllConsSymbols, long nseq) { completeConsensus(consensus, hconsensus, iStart, width, - ignoreGapsInConsensusCalculation, includeAllConsSymbols, null); // new + ignoreGapsInConsensusCalculation, includeAllConsSymbols, null, nseq); // new // char[] // { 'A', 'C', 'G', 'T', 'U' }); } @@ -206,7 +219,7 @@ public class AAFrequency public static void completeConsensus(AlignmentAnnotation consensus, Hashtable[] hconsensus, int iStart, int width, boolean ignoreGapsInConsensusCalculation, - boolean includeAllConsSymbols, char[] alphabet) + boolean includeAllConsSymbols, char[] alphabet, long nseq) { float tval, value; if (consensus == null || consensus.annotations == null @@ -216,9 +229,27 @@ public class AAFrequency // initialised properly return; } + String fmtstr="%3.1f"; + int precision=0; + while (nseq>=10) { + precision++; + nseq/=10; + } + final Format fmt; + if (precision>1) + { + //if (precision>2) + { + fmtstr = "%"+(2+precision)+"."+(precision)+"f"; + } + fmt = new Format(fmtstr); + } else { + fmt = null; + } for (int i = iStart; i < width; i++) { - if (i >= hconsensus.length) + Hashtable hci; + if (i >= hconsensus.length || ((hci = hconsensus[i]) == null)) { // happens if sequences calculated over were shorter than alignment // width @@ -226,25 +257,30 @@ public class AAFrequency continue; } value = 0; + Float fv; if (ignoreGapsInConsensusCalculation) { - value = ((Float) hconsensus[i].get(AAFrequency.PID_NOGAPS)) - .floatValue(); + fv = (Float) hci.get(AAFrequency.PID_NOGAPS); } else { - value = ((Float) hconsensus[i].get(AAFrequency.PID_GAPS)) - .floatValue(); + fv = (Float) hci.get(AAFrequency.PID_GAPS); } - - String maxRes = hconsensus[i].get(AAFrequency.MAXRESIDUE).toString(); - String mouseOver = hconsensus[i].get(AAFrequency.MAXRESIDUE) + " "; + if (fv == null) + { + consensus.annotations[i] = null; + // data has changed below us .. give up and + continue; + } + value = fv.floatValue(); + String maxRes = hci.get(AAFrequency.MAXRESIDUE).toString(); + String mouseOver = hci.get(AAFrequency.MAXRESIDUE) + " "; if (maxRes.length() > 1) { mouseOver = "[" + maxRes + "] "; maxRes = "+"; } - int[][] profile = (int[][]) hconsensus[i].get(AAFrequency.PROFILE); + int[][] profile = (int[][]) hci.get(AAFrequency.PROFILE); if (profile != null && includeAllConsSymbols) { mouseOver = ""; @@ -252,12 +288,10 @@ public class AAFrequency { for (int c = 0; c < alphabet.length; c++) { - tval = ((float) profile[0][alphabet[c]]) - * 100f - / (float) profile[1][ignoreGapsInConsensusCalculation ? 1 - : 0]; + tval = profile[0][alphabet[c]] * 100f + / profile[1][ignoreGapsInConsensusCalculation ? 1 : 0]; mouseOver += ((c == 0) ? "" : "; ") + alphabet[c] + " " - + ((int) tval) + "%"; + + ((fmt!=null) ? fmt.form(tval) : ((int) tval)) + "%"; } } else @@ -268,7 +302,7 @@ public class AAFrequency { ca[c] = new char[] { (char) c }; - vl[c] = (float) profile[0][c]; + vl[c] = profile[0][c]; } ; jalview.util.QuickSort.sort(vl, ca); @@ -276,12 +310,11 @@ public class AAFrequency { if (((char[]) ca[c])[0] != '-') { - tval = ((float) profile[0][((char[]) ca[c])[0]]) + tval = profile[0][((char[]) ca[c])[0]] * 100f - / (float) profile[1][ignoreGapsInConsensusCalculation ? 1 - : 0]; + / profile[1][ignoreGapsInConsensusCalculation ? 1 : 0]; mouseOver += ((p == 0) ? "" : "; ") + ((char[]) ca[c])[0] - + " " + ((int) tval) + "%"; + + " " + ((fmt!=null) ? fmt.form(tval) : ((int) tval)) + "%"; p++; } @@ -291,7 +324,7 @@ public class AAFrequency } else { - mouseOver += ((int) value + "%"); + mouseOver += ((fmt!=null) ? fmt.form(value) : ((int) value)) + "%"; } consensus.annotations[i] = new Annotation(maxRes, mouseOver, ' ', value); @@ -317,20 +350,20 @@ public class AAFrequency { ca[c] = new char[] { (char) c }; - vl[c] = (float) profile[0][c]; + vl[c] = profile[0][c]; } ; jalview.util.QuickSort.sort(vl, ca); rtnval[0] = 2; - rtnval[1]=0; + rtnval[1] = 0; for (int c = ca.length - 1; profile[0][((char[]) ca[c])[0]] > 0; c--) { if (((char[]) ca[c])[0] != '-') { rtnval[rtnval[0]++] = ((char[]) ca[c])[0]; - rtnval[rtnval[0]] = (int) (((float) profile[0][((char[]) ca[c])[0]]) * 100f / (float) profile[1][ignoreGapsInConsensusCalculation ? 1 + rtnval[rtnval[0]] = (int) (profile[0][((char[]) ca[c])[0]] * 100f / profile[1][ignoreGapsInConsensusCalculation ? 1 : 0]); - rtnval[1]+=rtnval[rtnval[0]++]; + rtnval[1] += rtnval[rtnval[0]++]; } } return rtnval;