2 * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
3 * Copyright (C) $$Year-Rel$$ The Jalview Authors
5 * This file is part of Jalview.
7 * Jalview is free software: you can redistribute it and/or
8 * modify it under the terms of the GNU General Public License
9 * as published by the Free Software Foundation, either version 3
10 * of the License, or (at your option) any later version.
12 * Jalview is distributed in the hope that it will be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty
14 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
15 * PURPOSE. See the GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with Jalview. If not, see <http://www.gnu.org/licenses/>.
19 * The Jalview Authors are detailed in the 'AUTHORS' file.
21 package jalview.datamodel;
23 import java.util.List;
25 public class CigarArray extends CigarBase
28 * Do CIGAR operations on a set of sequences from many other cigars. BAD
29 * THINGS WILL HAPPEN IF A CIGARARRAY IS PASSED TO A CIGARARRAY or a CIGARCIGAR
30 * is given a CIGARARRAY to insert gaps into.
33 * array of subject cigars
// Reference cigars that this array applies its operations to. Starts out null
// and is assigned by the CigarSimple[] constructor when given non-empty input.
35 public CigarSimple refCigars[] = null;
// Cleared by the CigarSimple[] constructor when some entry is neither a
// SeqCigar nor a CigarCigar.
// NOTE(review): where this flag is set to true is not visible in this view.
37 private boolean seqcigararray = false;
47 * @return boolean true if all refCigars resolve to a SeqCigar or a CigarCigar
// Reports whether this array consists only of SeqCigar or CigarCigar entries.
// NOTE(review): the method body is not visible in this view; presumably it
// returns the seqcigararray field - confirm against the full file.
49 public boolean isSeqCigarArray()
55 * Apply CIGAR operations to several cigars in parallel. Will throw an error
56 * if any of the cigars are actually CigarArrays.
// Builds a CigarArray over the given reference cigars.
// NOTE(review): statements between the signature and the guard below are not
// visible in this view.
61 public CigarArray(CigarSimple[] cigars)
// only non-null, non-empty input is copied into refCigars
65 if (cigars != null && cigars.length > 0)
67 refCigars = new CigarSimple[cigars.length];
68 for (int c = 0; c < cigars.length; c++)
// element-wise copy: the array is new, the cigar objects themselves are shared
70 refCigars[c] = cigars[c];
// an entry that is neither a SeqCigar nor a CigarCigar clears the
// seqcigararray flag for the whole array
71 if (!((cigars[c] instanceof SeqCigar)
72 || cigars[c] instanceof CigarCigar))
74 seqcigararray = false;
81 * construct a cigar array from the current alignment, or just the subset of
82 * the current alignment specified by selectionGroup. Any columns marked as
83 * hidden in the given HiddenColumns will be marked as deleted in the array.
86 * @param hidden
87 * @param selectionGroup
// Builds a CigarArray from an alignment, optionally restricted to
// selectionGroup. The reference cigars come from constructSeqCigarArray and
// the operation list is then filled in by constructFromAlignment.
89 public CigarArray(AlignmentI alignment, HiddenColumns hidden,
90 SequenceGroup selectionGroup)
// delegate to the CigarSimple[] constructor with one SeqCigar per sequence
92 this(constructSeqCigarArray(alignment, selectionGroup));
// a null hidden is passed on as a null region list
// NOTE(review): the final argument line of this call is not visible in this
// view; presumably it is selectionGroup - confirm.
93 constructFromAlignment(alignment,
94 hidden != null ? hidden.getHiddenColumnsCopy() : null,
// Computes a three-element bounds array for the selection or, failing that,
// the whole alignment: index 0 = number of sequences, index 1 = first column,
// index 2 = last column (inclusive).
// NOTE(review): the else keyword and the return statement are not visible in
// this view; callers index the result, so it presumably returns startend.
98 private static int[] _calcStartEndBounds(AlignmentI alignment,
99 SequenceGroup selectionGroup)
// defaults to all zeros, so the start column stays 0 unless a group sets it
101 int[] startend = new int[] { 0, 0, 0 };
// with a selection group, all three values come from the group
102 if (selectionGroup != null)
104 startend[0] = selectionGroup.getSize();
105 startend[1] = selectionGroup.getStartRes();
106 startend[2] = selectionGroup.getEndRes(); // inclusive for start and end
108 // SeqCigar constructor
// whole-alignment values: every sequence, last column = width - 1
112 startend[0] = alignment.getHeight();
113 startend[2] = alignment.getWidth() - 1;
// Creates one SeqCigar per sequence, each covering columns start..end
// (inclusive), for either the selection group or the whole alignment.
// NOTE(review): the declarations of i and iSize, the else keyword and the
// return statement are not visible in this view.
118 public static SeqCigar[] constructSeqCigarArray(AlignmentI alignment,
119 SequenceGroup selectionGroup)
121 SequenceI[] seqs = null;
123 int _startend[] = _calcStartEndBounds(alignment, selectionGroup);
// start and end are seeded from the shared bounds helper here
124 int start = _startend[1], end = _startend[2];
// NOTE(review): the assignments to start and end below repeat what
// _calcStartEndBounds already computed; only iSize and seqs are new.
125 if (selectionGroup != null)
127 iSize = selectionGroup.getSize();
// sequences of the group, ordered as they appear in the alignment
128 seqs = selectionGroup.getSequencesInOrder(alignment);
129 start = selectionGroup.getStartRes();
130 end = selectionGroup.getEndRes(); // inclusive for start and end in
131 // SeqCigar constructor
// whole-alignment values
135 iSize = alignment.getHeight();
136 seqs = alignment.getSequencesArray();
137 end = alignment.getWidth() - 1;
// one SeqCigar per sequence over the same column range
139 SeqCigar[] selseqs = new SeqCigar[iSize];
140 for (i = 0; i < iSize; i++)
142 selseqs[i] = new SeqCigar(seqs[i], start, end);
148 * internal constructor function - called by CigarArray(AlignmentI, ...);
152 * - list of hidden column regions, as supplied by
153 * HiddenColumns.getHiddenColumnsCopy() (may be null)
154 * @param selectionGroup
// Translates the hidden regions in list into this array operation list over
// the column range start..end taken from _calcStartEndBounds: visible
// stretches become M operations and hidden stretches become D operations.
// NOTE(review): several statements of this method (for example the
// assignment of hideEnd, the declaration and update of last and region, and
// the bodies of the guard branches) are not visible in this view.
156 private void constructFromAlignment(AlignmentI alignment,
157 List<int[]> list, SequenceGroup selectionGroup)
159 int[] _startend = _calcStartEndBounds(alignment, selectionGroup);
// index 1 is the first column, index 2 the last column (inclusive)
160 int start = _startend[1], end = _startend[2];
161 // now construct the CigarArray operations
165 int hideStart, hideEnd;
// walk the regions while the cursor last is before end and entries remain;
// the non-short-circuit & evaluates both operands on every pass
167 for (int j = 0; last < end & j < list.size(); j++)
169 region = list.get(j);
// element 0 of a region is its first hidden column
170 hideStart = region[0];
172 // edit hidden regions to selection range
174 // just move on if hideEnd is before last
179 // exit if next region is after end
185 // truncate region at start if last falls in region
186 if ((hideStart < last) && (hideEnd >= last))
191 // truncate region at end if end falls in region
192 if (hideEnd > end) // already checked that hideStart<=end
// visible columns between the cursor and the region become one match
200 if (last < hideStart)
202 addOperation(CigarArray.M, hideStart - last);
// the hidden region becomes a deletion; both bounds are inclusive, hence + 1
204 addOperation(CigarArray.D, 1 + hideEnd - hideStart);
207 // Final match if necessary.
// remaining visible columns from last through end (inclusive)
210 addOperation(CigarArray.M, end - last + 1);
// single match spanning start..end
// NOTE(review): presumably the branch taken when list is null; the enclosing
// condition is not visible in this view.
215 addOperation(CigarArray.M, end - start + 1);
220 * @see CigarBase#getSequenceAndDeletions
// Applies this array operations to the sequence string of every reference
// cigar and collects the per-cigar results, one row per reference cigar.
// NOTE(review): the result of the guard below, any else branch and the return
// statement are not visible in this view.
225 protected Object[][] getArrayofSequenceAndDeletions(char GapChar)
// nothing to do without reference cigars or without operations
227 if (refCigars == null || refCigars.length == 0 || length == 0)
// rows are null until filled in below
231 Object[][] sqanddels = new Object[refCigars.length][];
232 for (int c = 0; c < refCigars.length; c++)
234 String refString = refCigars[c].getSequenceString(GapChar);
// only reference cigars that yield a string get a result row
235 if (refString != null)
237 sqanddels[c] = getSequenceAndDeletions(refString, GapChar);
248 * NOTE: this is an improper sequence string function
250 * @return String formed by newline concatenated results of applying CIGAR
251 * operations to each reference object in turn.
254 * @return '\n' separated strings (empty results included as \n\n)
// Concatenates element 0 of each result row from
// getArrayofSequenceAndDeletions into one string, using '\n' as separator.
// NOTE(review): the result of the guard below is not visible in this view.
256 public String getSequenceString(char GapChar)
258 if (length == 0 || refCigars == null)
262 StringBuffer seqStrings = new StringBuffer();
263 Object[][] sqanddels = getArrayofSequenceAndDeletions(GapChar);
264 for (int c = 0; c < refCigars.length; c++)
// rows can be null when a reference cigar produced no sequence string
266 if (sqanddels[c] != null)
268 seqStrings.append((String) sqanddels[c][0]);
// drop the reference once it has been appended
269 sqanddels[c][0] = null;
// NOTE(review): going by the javadoc fragment before this method, a newline
// is emitted for every reference cigar, including those with no result.
271 seqStrings.append('\n');
273 return seqStrings.toString();
277 * return string results of applying cigar string to all reference cigars
// Returns element 0 of each result row from getArrayofSequenceAndDeletions
// as a String array, one entry per reference cigar.
// NOTE(review): the result of the guard below and the return statement are
// not visible in this view.
283 public String[] getSequenceStrings(char GapChar)
286 if (length == 0 || refCigars == null || refCigars.length == 0)
290 Object[][] sqanddels = getArrayofSequenceAndDeletions(GapChar);
291 String[] seqs = new String[sqanddels.length];
292 for (int c = 0; c < refCigars.length; c++)
// NOTE(review): unlike getSequenceString, there is no null check on
// sqanddels[c] here. A reference cigar whose sequence string is null
// appears to leave its row null, which would make this line throw a
// NullPointerException - confirm and guard if so.
294 seqs[c] = (String) sqanddels[c][0];
300 * Combines the CigarArray cigar operations with the operations in each
301 * reference cigar - creating a new reference cigar
305 * public CigarBase[] getEditedCigars() {
307 * return new CigarBase[] {}; }
310 * applyDeletions edits underlying refCigars to propagate deleted regions, and
311 * removes deletion operations from CigarArray operation list.
313 * @return int[] position after deletion occurred and range of deletion in
314 * cigarArray or null if none occurred
// Removes D operations from this array operation list and applies each
// deleted range to every reference cigar via deleteRange.
// NOTE(review): the loop header, some cursor updates and the return statement
// are not visible in this view; the javadoc fragment before this method
// describes the result as position and range pairs, or null if none occurred.
316 public int[] applyDeletions()
// raw Vector that collects one int[] {position, width} pair per deletion
318 java.util.Vector delpos = null;
323 int cursor = 0; // range counter for deletions
324 int vcursor = 0; // visible column index
325 int offset = 0; // shift in visible column index as deletions are made
// entries that are not deletions are stepped over
329 if (operation[i] != D)
331 if (operation[i] == M)
// advance the visible column index by this entry width, then move to the
// next entry
335 vcursor += range[i++];
// NOTE(review): presumably created only on the first deletion; the guarding
// condition is not visible in this view.
341 delpos = new java.util.Vector();
// inclusive column range covered by this deletion, in cursor coordinates
343 int delstart = cursor, delend = cursor + range[i] - 1; // inclusive
// remember where the deletion sits and how wide it is
344 delpos.addElement(new int[] { vcursor + offset, range[i] }); // index of
349 // hidden region boundary
350 offset += range[i] - 1; // shift in visible column coordinates
// close the gap left by the D entry by shifting later entries down one slot
// NOTE(review): copying length - i elements from index i + 1 reads index
// length, so this relies on the backing arrays having spare capacity
// beyond length - confirm.
351 System.arraycopy(operation, i + 1, operation, i, length - i);
352 System.arraycopy(range, i + 1, range, i, length - i);
355 * int dmax=0; for (int s=0; s<refCigars.length; s++) { int d =
356 * refCigars[s].deleteRange(delstart, delend); if (d>dmax) dmax=d; }
357 * offset+=dmax; // shift in visible column coordinates
// propagate the deleted range to every reference cigar
359 for (int s = 0; s < refCigars.length; s++)
// NOTE(review): any use of the returned value d is not visible in this view
361 int d = refCigars[s].deleteRange(delstart, delend);
// flatten the collected pairs into one int array, two slots per deletion
368 int[] pos = new int[delpos.size() * 2];
369 for (int k = 0, l = delpos.size(); k < l; k++)
371 int[] dr = ((int[]) delpos.elementAt(k));
// odd slots hold the deletion width
// NOTE(review): the assignment of the even slot is not visible in this view;
// presumably it receives dr[0].
373 pos[k * 2 + 1] = dr[1];
// release the pair once it has been copied out
374 delpos.setElementAt(null, k);
384 * @return SeqCigar[] or null if CigarArray is not a SeqCigarArray (ie it does
385 * not resolve to set of seqCigars)
// Returns the reference cigars as a SeqCigar array.
// NOTE(review): the result of the guard below and the return statement are
// not visible in this view; the javadoc fragment before this method says null
// is returned when this is not a SeqCigar array.
387 public SeqCigar[] getSeqCigarArray()
389 if (!isSeqCigarArray())
393 SeqCigar[] sa = new SeqCigar[refCigars.length];
394 for (int i = 0; i < refCigars.length; i++)
// NOTE(review): the CigarSimple[] constructor also accepts CigarCigar entries
// without clearing the flag, so this cast would throw a ClassCastException
// for such an entry unless CigarCigar is a subtype of SeqCigar - confirm.
396 sa[i] = (SeqCigar) refCigars[i];