src/jalview/datamodel/Sequence.java

   1 /*
   2  * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
   3  * Copyright (C) $$Year-Rel$$ The Jalview Authors
   4  *
   5  * This file is part of Jalview.
   6  *
   7  * Jalview is free software: you can redistribute it and/or
   8  * modify it under the terms of the GNU General Public License
   9  * as published by the Free Software Foundation, either version 3
  10  * of the License, or (at your option) any later version.
  11  *
  12  * Jalview is distributed in the hope that it will be useful, but
  13  * WITHOUT ANY WARRANTY; without even the implied warranty
  14  * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
  15  * PURPOSE.  See the GNU General Public License for more details.
  16  *
  17  * You should have received a copy of the GNU General Public License
  18  * along with Jalview.  If not, see <http://www.gnu.org/licenses/>.
  19  * The Jalview Authors are detailed in the 'AUTHORS' file.
  20  */
  21 package jalview.datamodel;
  22
  23 import jalview.analysis.AlignSeq;
  24 import jalview.api.DBRefEntryI;
  25 import jalview.datamodel.features.SequenceFeatures;
  26 import jalview.datamodel.features.SequenceFeaturesI;
  27 import jalview.util.Comparison;
  28 import jalview.util.DBRefUtils;
  29 import jalview.util.MapList;
  30 import jalview.util.StringUtils;
  31
  32 import java.util.ArrayList;
  33 import java.util.Arrays;
  34 import java.util.BitSet;
  35 import java.util.Collections;
  36 import java.util.Enumeration;
  37 import java.util.List;
  38 import java.util.ListIterator;
  39 import java.util.Vector;
  40
  41 import com.stevesoft.pat.Regex;
  42
  43 import fr.orsay.lri.varna.models.rna.RNA;
  44
  45 /**
  46  *
  47  * Implements the SequenceI interface for a char[] based sequence object.
  48  *
  49  * @author $author$
  50  * @version $Revision$
  51  */
  52 public class Sequence extends ASequence implements SequenceI
  53 {
  54   private static final Regex limitrx = new Regex(
  55           "[/][0-9]{1,}[-][0-9]{1,}$");
  56
  57   private static final Regex endrx = new Regex("[0-9]{1,}$");
  58
  59   SequenceI datasetSequence;
  60
  61   String name;
  62
  63   private char[] sequence;
  64
  65   String description;
  66
  67   int start;
  68
  69   int end;
  70
  71   Vector<PDBEntry> pdbIds;
  72
  73   String vamsasId;
  74
  75   DBRefEntry[] dbrefs;
  76
  77   RNA rna;
  78
  79   /**
  80    * This annotation is displayed below the alignment but the positions are tied
  81    * to the residues of this sequence
  82    *
  83    * TODO: change to List<>
  84    */
  85   Vector<AlignmentAnnotation> annotation;
  86
  87   /**
  88    * The index of the sequence in a MSA
  89    */
  90   int index = -1;
  91
  92   private SequenceFeatures sequenceFeatureStore;
  93
  94   /*
  95    * A cursor holding the approximate current view position to the sequence,
  96    * as determined by findIndex or findPosition or findPositions.
  97    * Using a cursor as a hint allows these methods to be more performant for
  98    * large sequences.
  99    */
 100   private SequenceCursor cursor;
 101
 102   /*
 103    * A number that should be incremented whenever the sequence is edited.
 104    * If the value matches the cursor token, then we can trust the cursor,
 105    * if not then it should be recomputed.
 106    */
 107   private int changeCount;
 108
 109   /**
 110    * Creates a new Sequence object.
 111    *
 112    * @param name
 113    *          display name string
 114    * @param sequence
 115    *          string to form a possibly gapped sequence out of
 116    * @param start
 117    *          first position of non-gap residue in the sequence
 118    * @param end
 119    *          last position of ungapped residues (nearly always only used for
 120    *          display purposes)
 121    */
 122   public Sequence(String name, String sequence, int start, int end)
 123   {
 124     this();
 125     initSeqAndName(name, sequence.toCharArray(), start, end);
 126   }
 127
 128   public Sequence(String name, char[] sequence, int start, int end)
 129   {
 130     this();
 131     initSeqAndName(name, sequence, start, end);
 132   }
 133
 134   /**
 135    * Stage 1 constructor - assign name, sequence, and set start and end fields.
 136    * start and end are updated values from name2 if it ends with /start-end
 137    *
 138    * @param name2
 139    * @param sequence2
 140    * @param start2
 141    * @param end2
 142    */
 143   protected void initSeqAndName(String name2, char[] sequence2, int start2,
 144           int end2)
 145   {
 146     this.name = name2;
 147     this.sequence = sequence2;
 148     this.start = start2;
 149     this.end = end2;
 150     parseId();
 151     checkValidRange();
 152   }
 153
 154   void parseId()
 155   {
 156     if (name == null)
 157     {
 158       System.err
 159               .println("POSSIBLE IMPLEMENTATION ERROR: null sequence name passed to constructor.");
 160       name = "";
 161     }
 162     // Does sequence have the /start-end signature?
 163     if (limitrx.search(name))
 164     {
 165       name = limitrx.left();
 166       endrx.search(limitrx.stringMatched());
 167       setStart(Integer.parseInt(limitrx.stringMatched().substring(1,
 168               endrx.matchedFrom() - 1)));
 169       setEnd(Integer.parseInt(endrx.stringMatched()));
 170     }
 171   }
 172
 173   void checkValidRange()
 174   {
 175     // Note: JAL-774 :
 176     // http://issues.jalview.org/browse/JAL-774?focusedCommentId=11239&page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel#comment-11239
 177     {
 178       int endRes = 0;
 179       for (int j = 0; j < sequence.length; j++)
 180       {
 181         if (!jalview.util.Comparison.isGap(sequence[j]))
 182         {
 183           endRes++;
 184         }
 185       }
 186       if (endRes > 0)
 187       {
 188         endRes += start - 1;
 189       }
 190
 191       if (end < endRes)
 192       {
 193         end = endRes;
 194       }
 195     }
 196
 197   }
 198
 199   /**
 200    * default constructor
 201    */
 202   private Sequence()
 203   {
 204     sequenceFeatureStore = new SequenceFeatures();
 205   }
 206
 207   /**
 208    * Creates a new Sequence object.
 209    *
 210    * @param name
 211    *          DOCUMENT ME!
 212    * @param sequence
 213    *          DOCUMENT ME!
 214    */
 215   public Sequence(String name, String sequence)
 216   {
 217     this(name, sequence, 1, -1);
 218   }
 219
 220   /**
 221    * Creates a new Sequence object with new AlignmentAnnotations but inherits
 222    * any existing dataset sequence reference. If non exists, everything is
 223    * copied.
 224    *
 225    * @param seq
 226    *          if seq is a dataset sequence, behaves like a plain old copy
 227    *          constructor
 228    */
 229   public Sequence(SequenceI seq)
 230   {
 231     this(seq, seq.getAnnotation());
 232   }
 233
 234   /**
 235    * Create a new sequence object with new features, DBRefEntries, and PDBIds
 236    * but inherits any existing dataset sequence reference, and duplicate of any
 237    * annotation that is present in the given annotation array.
 238    *
 239    * @param seq
 240    *          the sequence to be copied
 241    * @param alAnnotation
 242    *          an array of annotation including some associated with seq
 243    */
 244   public Sequence(SequenceI seq, AlignmentAnnotation[] alAnnotation)
 245   {
 246     this();
 247     initSeqFrom(seq, alAnnotation);
 248   }
 249
 250   /**
 251    * does the heavy lifting when cloning a dataset sequence, or coping data from
 252    * dataset to a new derived sequence.
 253    *
 254    * @param seq
 255    *          - source of attributes.
 256    * @param alAnnotation
 257    *          - alignment annotation present on seq that should be copied onto
 258    *          this sequence
 259    */
 260   protected void initSeqFrom(SequenceI seq,
 261           AlignmentAnnotation[] alAnnotation)
 262   {
 263     char[] oseq = seq.getSequence(); // returns a copy of the array
 264     initSeqAndName(seq.getName(), oseq, seq.getStart(), seq.getEnd());
 265
 266     description = seq.getDescription();
 267     if (seq != datasetSequence)
 268     {
 269       setDatasetSequence(seq.getDatasetSequence());
 270     }
 271
 272     /*
 273      * only copy DBRefs and seqfeatures if we really are a dataset sequence
 274      */
 275     if (datasetSequence == null)
 276     {
 277       if (seq.getDBRefs() != null)
 278       {
 279         DBRefEntry[] dbr = seq.getDBRefs();
 280         for (int i = 0; i < dbr.length; i++)
 281         {
 282           addDBRef(new DBRefEntry(dbr[i]));
 283         }
 284       }
 285
 286       /*
 287        * make copies of any sequence features
 288        */
 289       for (SequenceFeature sf : seq.getSequenceFeatures())
 290       {
 291         addSequenceFeature(new SequenceFeature(sf));
 292       }
 293     }
 294
 295     if (seq.getAnnotation() != null)
 296     {
 297       AlignmentAnnotation[] sqann = seq.getAnnotation();
 298       for (int i = 0; i < sqann.length; i++)
 299       {
 300         if (sqann[i] == null)
 301         {
 302           continue;
 303         }
 304         boolean found = (alAnnotation == null);
 305         if (!found)
 306         {
 307           for (int apos = 0; !found && apos < alAnnotation.length; apos++)
 308           {
 309             found = (alAnnotation[apos] == sqann[i]);
 310           }
 311         }
 312         if (found)
 313         {
 314           // only copy the given annotation
 315           AlignmentAnnotation newann = new AlignmentAnnotation(sqann[i]);
 316           addAlignmentAnnotation(newann);
 317         }
 318       }
 319     }
 320     if (seq.getAllPDBEntries() != null)
 321     {
 322       Vector<PDBEntry> ids = seq.getAllPDBEntries();
 323       for (PDBEntry pdb : ids)
 324       {
 325         this.addPDBId(new PDBEntry(pdb));
 326       }
 327     }
 328   }
 329
 330   @Override
 331   public void setSequenceFeatures(List<SequenceFeature> features)
 332   {
 333     if (datasetSequence != null)
 334     {
 335       datasetSequence.setSequenceFeatures(features);
 336       return;
 337     }
 338     sequenceFeatureStore = new SequenceFeatures(features);
 339   }
 340
 341   @Override
 342   public synchronized boolean addSequenceFeature(SequenceFeature sf)
 343   {
 344     if (sf.getType() == null)
 345     {
 346       System.err.println("SequenceFeature type may not be null: "
 347               + sf.toString());
 348       return false;
 349     }
 350
 351     if (datasetSequence != null)
 352     {
 353       return datasetSequence.addSequenceFeature(sf);
 354     }
 355
 356     return sequenceFeatureStore.add(sf);
 357   }
 358
 359   @Override
 360   public void deleteFeature(SequenceFeature sf)
 361   {
 362     if (datasetSequence != null)
 363     {
 364       datasetSequence.deleteFeature(sf);
 365     }
 366     else
 367     {
 368       sequenceFeatureStore.delete(sf);
 369     }
 370   }
 371
 372   /**
 373    * {@inheritDoc}
 374    *
 375    * @return
 376    */
 377   @Override
 378   public List<SequenceFeature> getSequenceFeatures()
 379   {
 380     if (datasetSequence != null)
 381     {
 382       return datasetSequence.getSequenceFeatures();
 383     }
 384     return sequenceFeatureStore.getAllFeatures();
 385   }
 386
 387   @Override
 388   public SequenceFeaturesI getFeatures()
 389   {
 390     return datasetSequence != null ? datasetSequence.getFeatures()
 391             : sequenceFeatureStore;
 392   }
 393
 394   @Override
 395   public boolean addPDBId(PDBEntry entry)
 396   {
 397     if (pdbIds == null)
 398     {
 399       pdbIds = new Vector<PDBEntry>();
 400       pdbIds.add(entry);
 401       return true;
 402     }
 403
 404     for (PDBEntry pdbe : pdbIds)
 405     {
 406       if (pdbe.updateFrom(entry))
 407       {
 408         return false;
 409       }
 410     }
 411     pdbIds.addElement(entry);
 412     return true;
 413   }
 414
 415   /**
 416    * DOCUMENT ME!
 417    *
 418    * @param id
 419    *          DOCUMENT ME!
 420    */
 421   @Override
 422   public void setPDBId(Vector<PDBEntry> id)
 423   {
 424     pdbIds = id;
 425   }
 426
 427   /**
 428    * DOCUMENT ME!
 429    *
 430    * @return DOCUMENT ME!
 431    */
 432   @Override
 433   public Vector<PDBEntry> getAllPDBEntries()
 434   {
 435     return pdbIds == null ? new Vector<PDBEntry>() : pdbIds;
 436   }
 437
 438   /**
 439    * DOCUMENT ME!
 440    *
 441    * @return DOCUMENT ME!
 442    */
 443   @Override
 444   public String getDisplayId(boolean jvsuffix)
 445   {
 446     StringBuffer result = new StringBuffer(name);
 447     if (jvsuffix)
 448     {
 449       result.append("/" + start + "-" + end);
 450     }
 451
 452     return result.toString();
 453   }
 454
 455   /**
 456    * DOCUMENT ME!
 457    *
 458    * @param name
 459    *          DOCUMENT ME!
 460    */
 461   @Override
 462   public void setName(String name)
 463   {
 464     this.name = name;
 465     this.parseId();
 466   }
 467
 468   /**
 469    * DOCUMENT ME!
 470    *
 471    * @return DOCUMENT ME!
 472    */
 473   @Override
 474   public String getName()
 475   {
 476     return this.name;
 477   }
 478
 479   /**
 480    * DOCUMENT ME!
 481    *
 482    * @param start
 483    *          DOCUMENT ME!
 484    */
 485   @Override
 486   public void setStart(int start)
 487   {
 488     this.start = start;
 489   }
 490
 491   /**
 492    * DOCUMENT ME!
 493    *
 494    * @return DOCUMENT ME!
 495    */
 496   @Override
 497   public int getStart()
 498   {
 499     return this.start;
 500   }
 501
 502   /**
 503    * DOCUMENT ME!
 504    *
 505    * @param end
 506    *          DOCUMENT ME!
 507    */
 508   @Override
 509   public void setEnd(int end)
 510   {
 511     this.end = end;
 512   }
 513
 514   /**
 515    * DOCUMENT ME!
 516    *
 517    * @return DOCUMENT ME!
 518    */
 519   @Override
 520   public int getEnd()
 521   {
 522     return this.end;
 523   }
 524
 525   /**
 526    * DOCUMENT ME!
 527    *
 528    * @return DOCUMENT ME!
 529    */
 530   @Override
 531   public int getLength()
 532   {
 533     return this.sequence.length;
 534   }
 535
 536   /**
 537    * DOCUMENT ME!
 538    *
 539    * @param seq
 540    *          DOCUMENT ME!
 541    */
 542   @Override
 543   public void setSequence(String seq)
 544   {
 545     this.sequence = seq.toCharArray();
 546     checkValidRange();
 547     sequenceChanged();
 548   }
 549
 550   @Override
 551   public String getSequenceAsString()
 552   {
 553     return new String(sequence);
 554   }
 555
 556   @Override
 557   public String getSequenceAsString(int start, int end)
 558   {
 559     return new String(getSequence(start, end));
 560   }
 561
 562   @Override
 563   public char[] getSequence()
 564   {
 565     // return sequence;
 566     return sequence == null ? null : Arrays.copyOf(sequence,
 567             sequence.length);
 568   }
 569
 570   /*
 571    * (non-Javadoc)
 572    *
 573    * @see jalview.datamodel.SequenceI#getSequence(int, int)
 574    */
 575   @Override
 576   public char[] getSequence(int start, int end)
 577   {
 578     if (start < 0)
 579     {
 580       start = 0;
 581     }
 582     // JBPNote - left to user to pad the result here (TODO:Decide on this
 583     // policy)
 584     if (start >= sequence.length)
 585     {
 586       return new char[0];
 587     }
 588
 589     if (end >= sequence.length)
 590     {
 591       end = sequence.length;
 592     }
 593
 594     char[] reply = new char[end - start];
 595     System.arraycopy(sequence, start, reply, 0, end - start);
 596
 597     return reply;
 598   }
 599
 600   @Override
 601   public SequenceI getSubSequence(int start, int end)
 602   {
 603     if (start < 0)
 604     {
 605       start = 0;
 606     }
 607     char[] seq = getSequence(start, end);
 608     if (seq.length == 0)
 609     {
 610       return null;
 611     }
 612     int nstart = findPosition(start);
 613     int nend = findPosition(end) - 1;
 614     // JBPNote - this is an incomplete copy.
 615     SequenceI nseq = new Sequence(this.getName(), seq, nstart, nend);
 616     nseq.setDescription(description);
 617     if (datasetSequence != null)
 618     {
 619       nseq.setDatasetSequence(datasetSequence);
 620     }
 621     else
 622     {
 623       nseq.setDatasetSequence(this);
 624     }
 625     return nseq;
 626   }
 627
 628   /**
 629    * Returns the character of the aligned sequence at the given position (base
 630    * zero), or space if the position is not within the sequence's bounds
 631    *
 632    * @return
 633    */
 634   @Override
 635   public char getCharAt(int i)
 636   {
 637     if (i >= 0 && i < sequence.length)
 638     {
 639       return sequence[i];
 640     }
 641     else
 642     {
 643       return ' ';
 644     }
 645   }
 646
 647   /**
 648    * DOCUMENT ME!
 649    *
 650    * @param desc
 651    *          DOCUMENT ME!
 652    */
 653   @Override
 654   public void setDescription(String desc)
 655   {
 656     this.description = desc;
 657   }
 658
 659   /**
 660    * DOCUMENT ME!
 661    *
 662    * @return DOCUMENT ME!
 663    */
 664   @Override
 665   public String getDescription()
 666   {
 667     return this.description;
 668   }
 669
 670   /**
 671    * {@inheritDoc}
 672    */
 673   @Override
 674   public int findIndex(int pos)
 675   {
 676     /*
 677      * use a valid, hopefully nearby, cursor if available
 678      */
 679     if (isValidCursor(cursor))
 680     {
 681       return findIndex(pos, cursor);
 682     }
 683
 684     int j = start;
 685     int i = 0;
 686     int startColumn = 0;
 687
 688     /*
 689      * traverse sequence from the start counting gaps; make a note of
 690      * the column of the first residue to save in the cursor
 691      */
 692     while ((i < sequence.length) && (j <= end) && (j <= pos))
 693     {
 694       if (!Comparison.isGap(sequence[i]))
 695       {
 696         if (j == start)
 697         {
 698           startColumn = i;
 699         }
 700         j++;
 701       }
 702       i++;
 703     }
 704
 705     if (j == end && j < pos)
 706     {
 707       return end + 1;
 708     }
 709
 710     updateCursor(pos, i, startColumn);
 711     return i;
 712   }
 713
 714   /**
 715    * Updates the cursor to the latest found residue and column position
 716    *
 717    * @param residuePos
 718    *          (start..)
 719    * @param column
 720    *          (1..)
 721    * @param startColumn
 722    *          column position of the first sequence residue
 723    */
 724   protected void updateCursor(int residuePos, int column, int startColumn)
 725   {
 726     /*
 727      * preserve end residue column provided cursor was valid
 728      */
 729     int endColumn = isValidCursor(cursor) ? cursor.lastColumnPosition : 0;
 730     if (residuePos == this.end)
 731     {
 732       endColumn = column;
 733     }
 734
 735     cursor = new SequenceCursor(this, residuePos, column, startColumn,
 736             endColumn, this.changeCount);
 737   }
 738
 739   /**
 740    * Answers the aligned column position (1..) for the given residue position
 741    * (start..) given a 'hint' of a residue/column location in the neighbourhood.
 742    * The hint may be left of, at, or to the right of the required position.
 743    *
 744    * @param pos
 745    * @param curs
 746    * @return
 747    */
 748   protected int findIndex(int pos, SequenceCursor curs)
 749   {
 750     if (!isValidCursor(curs))
 751     {
 752       /*
 753        * wrong or invalidated cursor, compute de novo
 754        */
 755       return findIndex(pos);
 756     }
 757
 758     if (curs.residuePosition == pos)
 759     {
 760       return curs.columnPosition;
 761     }
 762
 763     /*
 764      * move left or right to find pos from hint.position
 765      */
 766     int col = curs.columnPosition - 1; // convert from base 1 to 0-based array
 767                                        // index
 768     int newPos = curs.residuePosition;
 769     int delta = newPos > pos ? -1 : 1;
 770
 771     while (newPos != pos)
 772     {
 773       col += delta; // shift one column left or right
 774       if (col < 0 || col == sequence.length)
 775       {
 776         break;
 777       }
 778       if (!Comparison.isGap(sequence[col]))
 779       {
 780         newPos += delta;
 781       }
 782     }
 783
 784     col++; // convert back to base 1
 785     updateCursor(pos, col, curs.firstColumnPosition);
 786
 787     return col;
 788   }
 789
 790   /**
 791    * {@inheritDoc}
 792    */
 793   @Override
 794   public int findPosition(final int column)
 795   {
 796     /*
 797      * use a valid, hopefully nearby, cursor if available
 798      */
 799     if (isValidCursor(cursor))
 800     {
 801       return findPosition(column + 1, cursor);
 802     }
 803
 804     // TODO recode this more naturally i.e. count residues only
 805     // as they are found, not 'in anticipation'
 806
 807     /*
 808      * traverse the sequence counting gaps; note the column position
 809      * of the first residue, to save in the cursor
 810      */
 811     int firstResidueColumn = 0;
 812     int lastPosFound = 0;
 813     int lastPosFoundColumn = 0;
 814     int seqlen = sequence.length;
 815
 816     if (seqlen > 0 && !Comparison.isGap(sequence[0]))
 817     {
 818       lastPosFound = start;
 819       lastPosFoundColumn = 0;
 820     }
 821
 822     int j = 0;
 823     int pos = start;
 824
 825     while (j < column && j < seqlen)
 826     {
 827       if (!Comparison.isGap(sequence[j]))
 828       {
 829         lastPosFound = pos;
 830         lastPosFoundColumn = j;
 831         if (pos == this.start)
 832         {
 833           firstResidueColumn = j;
 834         }
 835         pos++;
 836       }
 837       j++;
 838     }
 839     if (j < seqlen && !Comparison.isGap(sequence[j]))
 840     {
 841       lastPosFound = pos;
 842       lastPosFoundColumn = j;
 843       if (pos == this.start)
 844       {
 845         firstResidueColumn = j;
 846       }
 847     }
 848
 849     /*
 850      * update the cursor to the last residue position found (if any)
 851      * (converting column position to base 1)
 852      */
 853     if (lastPosFound != 0)
 854     {
 855       updateCursor(lastPosFound, lastPosFoundColumn + 1,
 856               firstResidueColumn + 1);
 857     }
 858
 859     return pos;
 860   }
 861
 862   /**
 863    * Answers true if the given cursor is not null, is for this sequence object,
 864    * and has a token value that matches this object's changeCount, else false.
 865    * This allows us to ignore a cursor as 'stale' if the sequence has been
 866    * modified since the cursor was created.
 867    *
 868    * @param curs
 869    * @return
 870    */
 871   protected boolean isValidCursor(SequenceCursor curs)
 872   {
 873     if (curs == null || curs.sequence != this || curs.token != changeCount)
 874     {
 875       return false;
 876     }
 877     /*
 878      * sanity check against range
 879      */
 880     if (curs.columnPosition < 0 || curs.columnPosition > sequence.length)
 881     {
 882       return false;
 883     }
 884     if (curs.residuePosition < start || curs.residuePosition > end)
 885     {
 886       return false;
 887     }
 888     return true;
 889   }
 890
 891   /**
 892    * Answers the sequence position (start..) for the given aligned column
 893    * position (1..), given a hint of a cursor in the neighbourhood. The cursor
 894    * may lie left of, at, or to the right of the column position.
 895    *
 896    * @param col
 897    * @param curs
 898    * @return
 899    */
 900   protected int findPosition(final int col, SequenceCursor curs)
 901   {
 902     if (!isValidCursor(curs))
 903     {
 904       /*
 905        * wrong or invalidated cursor, compute de novo
 906        */
 907       return findPosition(col - 1);// ugh back to base 0
 908     }
 909
 910     if (curs.columnPosition == col)
 911     {
 912       cursor = curs; // in case this method becomes public
 913       return curs.residuePosition; // easy case :-)
 914     }
 915
 916     if (curs.lastColumnPosition > 0 && curs.lastColumnPosition < col)
 917     {
 918       /*
 919        * sequence lies entirely to the left of col
 920        * - return last residue + 1
 921        */
 922       return end + 1;
 923     }
 924
 925     if (curs.firstColumnPosition > 0 && curs.firstColumnPosition > col)
 926     {
 927       /*
 928        * sequence lies entirely to the right of col
 929        * - return first residue
 930        */
 931       return start;
 932     }
 933
 934     // todo could choose closest to col out of column,
 935     // firstColumnPosition, lastColumnPosition as a start point
 936
 937     /*
 938      * move left or right to find pos from cursor position
 939      */
 940     int firstResidueColumn = curs.firstColumnPosition;
 941     int column = curs.columnPosition - 1; // to base 0
 942     int newPos = curs.residuePosition;
 943     int delta = curs.columnPosition > col ? -1 : 1;
 944     boolean gapped = false;
 945     int lastFoundPosition = curs.residuePosition;
 946     int lastFoundPositionColumn = curs.columnPosition;
 947
 948     while (column != col - 1)
 949     {
 950       column += delta; // shift one column left or right
 951       if (column < 0 || column == sequence.length)
 952       {
 953         break;
 954       }
 955       gapped = Comparison.isGap(sequence[column]);
 956       if (!gapped)
 957       {
 958         newPos += delta;
 959         lastFoundPosition = newPos;
 960         lastFoundPositionColumn = column + 1;
 961         if (lastFoundPosition == this.start)
 962         {
 963           firstResidueColumn = column + 1;
 964         }
 965       }
 966     }
 967
 968     if (cursor == null || lastFoundPosition != cursor.residuePosition)
 969     {
 970       updateCursor(lastFoundPosition, lastFoundPositionColumn,
 971               firstResidueColumn);
 972     }
 973
 974     /*
 975      * hack to give position to the right if on a gap
 976      * or beyond the length of the sequence (see JAL-2562)
 977      */
 978     if (delta > 0 && (gapped || column >= sequence.length))
 979     {
 980       newPos++;
 981     }
 982
 983     return newPos;
 984   }
 985
 986   /**
 987    * Returns an int array where indices correspond to each residue in the
 988    * sequence and the element value gives its position in the alignment
 989    *
 990    * @return int[SequenceI.getEnd()-SequenceI.getStart()+1] or null if no
 991    *         residues in SequenceI object
 992    */
 993   @Override
 994   public int[] gapMap()
 995   {
 996     String seq = jalview.analysis.AlignSeq.extractGaps(
 997             jalview.util.Comparison.GapChars, new String(sequence));
 998     int[] map = new int[seq.length()];
 999     int j = 0;
1000     int p = 0;
1001
1002     while (j < sequence.length)
1003     {
1004       if (!jalview.util.Comparison.isGap(sequence[j]))
1005       {
1006         map[p++] = j;
1007       }
1008
1009       j++;
1010     }
1011
1012     return map;
1013   }
1014
1015   @Override
1016   public int[] findPositionMap()
1017   {
1018     int map[] = new int[sequence.length];
1019     int j = 0;
1020     int pos = start;
1021     int seqlen = sequence.length;
1022     while ((j < seqlen))
1023     {
1024       map[j] = pos;
1025       if (!jalview.util.Comparison.isGap(sequence[j]))
1026       {
1027         pos++;
1028       }
1029
1030       j++;
1031     }
1032     return map;
1033   }
1034
1035   @Override
1036   public List<int[]> getInsertions()
1037   {
1038     ArrayList<int[]> map = new ArrayList<int[]>();
1039     int lastj = -1, j = 0;
1040     int pos = start;
1041     int seqlen = sequence.length;
1042     while ((j < seqlen))
1043     {
1044       if (jalview.util.Comparison.isGap(sequence[j]))
1045       {
1046         if (lastj == -1)
1047         {
1048           lastj = j;
1049         }
1050       }
1051       else
1052       {
1053         if (lastj != -1)
1054         {
1055           map.add(new int[] { lastj, j - 1 });
1056           lastj = -1;
1057         }
1058       }
1059       j++;
1060     }
1061     if (lastj != -1)
1062     {
1063       map.add(new int[] { lastj, j - 1 });
1064       lastj = -1;
1065     }
1066     return map;
1067   }
1068
1069   @Override
1070   public BitSet getInsertionsAsBits()
1071   {
1072     BitSet map = new BitSet();
1073     int lastj = -1, j = 0;
1074     int pos = start;
1075     int seqlen = sequence.length;
1076     while ((j < seqlen))
1077     {
1078       if (jalview.util.Comparison.isGap(sequence[j]))
1079       {
1080         if (lastj == -1)
1081         {
1082           lastj = j;
1083         }
1084       }
1085       else
1086       {
1087         if (lastj != -1)
1088         {
1089           map.set(lastj, j);
1090           lastj = -1;
1091         }
1092       }
1093       j++;
1094     }
1095     if (lastj != -1)
1096     {
1097       map.set(lastj, j);
1098       lastj = -1;
1099     }
1100     return map;
1101   }
1102
1103   @Override
1104   public void deleteChars(int i, int j)
1105   {
1106     int newstart = start, newend = end;
1107     if (i >= sequence.length || i < 0)
1108     {
1109       return;
1110     }
1111
1112     char[] tmp = StringUtils.deleteChars(sequence, i, j);
1113     boolean createNewDs = false;
1114     // TODO: take a (second look) at the dataset creation validation method for
1115     // the very large sequence case
1116     int eindex = -1, sindex = -1;
1117     boolean ecalc = false, scalc = false;
1118     for (int s = i; s < j; s++)
1119     {
1120       if (jalview.schemes.ResidueProperties.aaIndex[sequence[s]] != 23)
1121       {
1122         if (createNewDs)
1123         {
1124           newend--;
1125         }
1126         else
1127         {
1128           if (!scalc)
1129           {
1130             sindex = findIndex(start) - 1;
1131             scalc = true;
1132           }
1133           if (sindex == s)
1134           {
1135             // delete characters including start of sequence
1136             newstart = findPosition(j);
1137             break; // don't need to search for any more residue characters.
1138           }
1139           else
1140           {
1141             // delete characters after start.
1142             if (!ecalc)
1143             {
1144               eindex = findIndex(end) - 1;
1145               ecalc = true;
1146             }
1147             if (eindex < j)
1148             {
1149               // delete characters at end of sequence
1150               newend = findPosition(i - 1);
1151               break; // don't need to search for any more residue characters.
1152             }
1153             else
1154             {
1155               createNewDs = true;
1156               newend--; // decrease end position by one for the deleted residue
1157               // and search further
1158             }
1159           }
1160         }
1161       }
1162     }
1163     // deletion occured in the middle of the sequence
1164     if (createNewDs && this.datasetSequence != null)
1165     {
1166       // construct a new sequence
1167       Sequence ds = new Sequence(datasetSequence);
1168       // TODO: remove any non-inheritable properties ?
1169       // TODO: create a sequence mapping (since there is a relation here ?)
1170       ds.deleteChars(i, j);
1171       datasetSequence = ds;
1172     }
1173     start = newstart;
1174     end = newend;
1175     sequence = tmp;
1176     sequenceChanged();
1177   }
1178
1179   @Override
1180   public void insertCharAt(int i, int length, char c)
1181   {
1182     char[] tmp = new char[sequence.length + length];
1183
1184     if (i >= sequence.length)
1185     {
1186       System.arraycopy(sequence, 0, tmp, 0, sequence.length);
1187       i = sequence.length;
1188     }
1189     else
1190     {
1191       System.arraycopy(sequence, 0, tmp, 0, i);
1192     }
1193
1194     int index = i;
1195     while (length > 0)
1196     {
1197       tmp[index++] = c;
1198       length--;
1199     }
1200
1201     if (i < sequence.length)
1202     {
1203       System.arraycopy(sequence, i, tmp, index, sequence.length - i);
1204     }
1205
1206     sequence = tmp;
1207     sequenceChanged();
1208   }
1209
1210   @Override
1211   public void insertCharAt(int i, char c)
1212   {
1213     insertCharAt(i, 1, c);
1214   }
1215
1216   @Override
1217   public String getVamsasId()
1218   {
1219     return vamsasId;
1220   }
1221
1222   @Override
1223   public void setVamsasId(String id)
1224   {
1225     vamsasId = id;
1226   }
1227
1228   @Override
1229   public void setDBRefs(DBRefEntry[] dbref)
1230   {
1231     if (dbrefs == null && datasetSequence != null
1232             && this != datasetSequence)
1233     {
1234       datasetSequence.setDBRefs(dbref);
1235       return;
1236     }
1237     dbrefs = dbref;
1238     if (dbrefs != null)
1239     {
1240       DBRefUtils.ensurePrimaries(this);
1241     }
1242   }
1243
1244   @Override
1245   public DBRefEntry[] getDBRefs()
1246   {
1247     if (dbrefs == null && datasetSequence != null
1248             && this != datasetSequence)
1249     {
1250       return datasetSequence.getDBRefs();
1251     }
1252     return dbrefs;
1253   }
1254
1255   @Override
1256   public void addDBRef(DBRefEntry entry)
1257   {
1258     if (datasetSequence != null)
1259     {
1260       datasetSequence.addDBRef(entry);
1261       return;
1262     }
1263
1264     if (dbrefs == null)
1265     {
1266       dbrefs = new DBRefEntry[0];
1267     }
1268
1269     for (DBRefEntryI dbr : dbrefs)
1270     {
1271       if (dbr.updateFrom(entry))
1272       {
1273         /*
1274          * found a dbref that either matched, or could be
1275          * updated from, the new entry - no need to add it
1276          */
1277         return;
1278       }
1279     }
1280
1281     /*
1282      * extend the array to make room for one more
1283      */
1284     // TODO use an ArrayList instead
1285     int j = dbrefs.length;
1286     DBRefEntry[] temp = new DBRefEntry[j + 1];
1287     System.arraycopy(dbrefs, 0, temp, 0, j);
1288     temp[temp.length - 1] = entry;
1289
1290     dbrefs = temp;
1291
1292     DBRefUtils.ensurePrimaries(this);
1293   }
1294
1295   @Override
1296   public void setDatasetSequence(SequenceI seq)
1297   {
1298     if (seq == this)
1299     {
1300       throw new IllegalArgumentException(
1301               "Implementation Error: self reference passed to SequenceI.setDatasetSequence");
1302     }
1303     if (seq != null && seq.getDatasetSequence() != null)
1304     {
1305       throw new IllegalArgumentException(
1306               "Implementation error: cascading dataset sequences are not allowed.");
1307     }
1308     datasetSequence = seq;
1309   }
1310
1311   @Override
1312   public SequenceI getDatasetSequence()
1313   {
1314     return datasetSequence;
1315   }
1316
1317   @Override
1318   public AlignmentAnnotation[] getAnnotation()
1319   {
1320     return annotation == null ? null : annotation
1321             .toArray(new AlignmentAnnotation[annotation.size()]);
1322   }
1323
1324   @Override
1325   public boolean hasAnnotation(AlignmentAnnotation ann)
1326   {
1327     return annotation == null ? false : annotation.contains(ann);
1328   }
1329
1330   @Override
1331   public void addAlignmentAnnotation(AlignmentAnnotation annotation)
1332   {
1333     if (this.annotation == null)
1334     {
1335       this.annotation = new Vector<AlignmentAnnotation>();
1336     }
1337     if (!this.annotation.contains(annotation))
1338     {
1339       this.annotation.addElement(annotation);
1340     }
1341     annotation.setSequenceRef(this);
1342   }
1343
1344   @Override
1345   public void removeAlignmentAnnotation(AlignmentAnnotation annotation)
1346   {
1347     if (this.annotation != null)
1348     {
1349       this.annotation.removeElement(annotation);
1350       if (this.annotation.size() == 0)
1351       {
1352         this.annotation = null;
1353       }
1354     }
1355   }
1356
1357   /**
1358    * test if this is a valid candidate for another sequence's dataset sequence.
1359    *
1360    */
1361   private boolean isValidDatasetSequence()
1362   {
1363     if (datasetSequence != null)
1364     {
1365       return false;
1366     }
1367     for (int i = 0; i < sequence.length; i++)
1368     {
1369       if (jalview.util.Comparison.isGap(sequence[i]))
1370       {
1371         return false;
1372       }
1373     }
1374     return true;
1375   }
1376
1377   @Override
1378   public SequenceI deriveSequence()
1379   {
1380     Sequence seq = null;
1381     if (datasetSequence == null)
1382     {
1383       if (isValidDatasetSequence())
1384       {
1385         // Use this as dataset sequence
1386         seq = new Sequence(getName(), "", 1, -1);
1387         seq.setDatasetSequence(this);
1388         seq.initSeqFrom(this, getAnnotation());
1389         return seq;
1390       }
1391       else
1392       {
1393         // Create a new, valid dataset sequence
1394         createDatasetSequence();
1395       }
1396     }
1397     return new Sequence(this);
1398   }
1399
1400   private boolean _isNa;
1401
1402   private int _seqhash = 0;
1403
1404   /**
1405    * Answers false if the sequence is more than 85% nucleotide (ACGTU), else
1406    * true
1407    */
1408   @Override
1409   public boolean isProtein()
1410   {
1411     if (datasetSequence != null)
1412     {
1413       return datasetSequence.isProtein();
1414     }
1415     if (_seqhash != sequence.hashCode())
1416     {
1417       _seqhash = sequence.hashCode();
1418       _isNa = Comparison.isNucleotide(this);
1419     }
1420     return !_isNa;
1421   };
1422
1423   /*
1424    * (non-Javadoc)
1425    *
1426    * @see jalview.datamodel.SequenceI#createDatasetSequence()
1427    */
1428   @Override
1429   public SequenceI createDatasetSequence()
1430   {
1431     if (datasetSequence == null)
1432     {
1433       Sequence dsseq = new Sequence(getName(), AlignSeq.extractGaps(
1434               jalview.util.Comparison.GapChars, getSequenceAsString()),
1435               getStart(), getEnd());
1436
1437       datasetSequence = dsseq;
1438
1439       dsseq.setDescription(description);
1440       // move features and database references onto dataset sequence
1441       dsseq.sequenceFeatureStore = sequenceFeatureStore;
1442       sequenceFeatureStore = null;
1443       dsseq.dbrefs = dbrefs;
1444       dbrefs = null;
1445       // TODO: search and replace any references to this sequence with
1446       // references to the dataset sequence in Mappings on dbref
1447       dsseq.pdbIds = pdbIds;
1448       pdbIds = null;
1449       datasetSequence.updatePDBIds();
1450       if (annotation != null)
1451       {
1452         // annotation is cloned rather than moved, to preserve what's currently
1453         // on the alignment
1454         for (AlignmentAnnotation aa : annotation)
1455         {
1456           AlignmentAnnotation _aa = new AlignmentAnnotation(aa);
1457           _aa.sequenceRef = datasetSequence;
1458           _aa.adjustForAlignment(); // uses annotation's own record of
1459                                     // sequence-column mapping
1460           datasetSequence.addAlignmentAnnotation(_aa);
1461         }
1462       }
1463     }
1464     return datasetSequence;
1465   }
1466
1467   /*
1468    * (non-Javadoc)
1469    *
1470    * @see
1471    * jalview.datamodel.SequenceI#setAlignmentAnnotation(AlignmmentAnnotation[]
1472    * annotations)
1473    */
1474   @Override
1475   public void setAlignmentAnnotation(AlignmentAnnotation[] annotations)
1476   {
1477     if (annotation != null)
1478     {
1479       annotation.removeAllElements();
1480     }
1481     if (annotations != null)
1482     {
1483       for (int i = 0; i < annotations.length; i++)
1484       {
1485         if (annotations[i] != null)
1486         {
1487           addAlignmentAnnotation(annotations[i]);
1488         }
1489       }
1490     }
1491   }
1492
1493   @Override
1494   public AlignmentAnnotation[] getAnnotation(String label)
1495   {
1496     if (annotation == null || annotation.size() == 0)
1497     {
1498       return null;
1499     }
1500
1501     Vector<AlignmentAnnotation> subset = new Vector<AlignmentAnnotation>();
1502     Enumeration<AlignmentAnnotation> e = annotation.elements();
1503     while (e.hasMoreElements())
1504     {
1505       AlignmentAnnotation ann = e.nextElement();
1506       if (ann.label != null && ann.label.equals(label))
1507       {
1508         subset.addElement(ann);
1509       }
1510     }
1511     if (subset.size() == 0)
1512     {
1513       return null;
1514     }
1515     AlignmentAnnotation[] anns = new AlignmentAnnotation[subset.size()];
1516     int i = 0;
1517     e = subset.elements();
1518     while (e.hasMoreElements())
1519     {
1520       anns[i++] = e.nextElement();
1521     }
1522     subset.removeAllElements();
1523     return anns;
1524   }
1525
1526   @Override
1527   public boolean updatePDBIds()
1528   {
1529     if (datasetSequence != null)
1530     {
1531       // TODO: could merge DBRefs
1532       return datasetSequence.updatePDBIds();
1533     }
1534     if (dbrefs == null || dbrefs.length == 0)
1535     {
1536       return false;
1537     }
1538     boolean added = false;
1539     for (DBRefEntry dbr : dbrefs)
1540     {
1541       if (DBRefSource.PDB.equals(dbr.getSource()))
1542       {
1543         /*
1544          * 'Add' any PDB dbrefs as a PDBEntry - add is only performed if the
1545          * PDB id is not already present in a 'matching' PDBEntry
1546          * Constructor parses out a chain code if appended to the accession id
1547          * (a fudge used to 'store' the chain code in the DBRef)
1548          */
1549         PDBEntry pdbe = new PDBEntry(dbr);
1550         added |= addPDBId(pdbe);
1551       }
1552     }
1553     return added;
1554   }
1555
1556   @Override
1557   public void transferAnnotation(SequenceI entry, Mapping mp)
1558   {
1559     if (datasetSequence != null)
1560     {
1561       datasetSequence.transferAnnotation(entry, mp);
1562       return;
1563     }
1564     if (entry.getDatasetSequence() != null)
1565     {
1566       transferAnnotation(entry.getDatasetSequence(), mp);
1567       return;
1568     }
1569     // transfer any new features from entry onto sequence
1570     if (entry.getSequenceFeatures() != null)
1571     {
1572
1573       List<SequenceFeature> sfs = entry.getSequenceFeatures();
1574       for (SequenceFeature feature : sfs)
1575       {
1576         SequenceFeature sf[] = (mp != null) ? mp.locateFeature(feature)
1577                 : new SequenceFeature[] { new SequenceFeature(feature) };
1578         if (sf != null)
1579         {
1580           for (int sfi = 0; sfi < sf.length; sfi++)
1581           {
1582             addSequenceFeature(sf[sfi]);
1583           }
1584         }
1585       }
1586     }
1587
1588     // transfer PDB entries
1589     if (entry.getAllPDBEntries() != null)
1590     {
1591       Enumeration<PDBEntry> e = entry.getAllPDBEntries().elements();
1592       while (e.hasMoreElements())
1593       {
1594         PDBEntry pdb = e.nextElement();
1595         addPDBId(pdb);
1596       }
1597     }
1598     // transfer database references
1599     DBRefEntry[] entryRefs = entry.getDBRefs();
1600     if (entryRefs != null)
1601     {
1602       for (int r = 0; r < entryRefs.length; r++)
1603       {
1604         DBRefEntry newref = new DBRefEntry(entryRefs[r]);
1605         if (newref.getMap() != null && mp != null)
1606         {
1607           // remap ref using our local mapping
1608         }
1609         // we also assume all version string setting is done by dbSourceProxy
1610         /*
1611          * if (!newref.getSource().equalsIgnoreCase(dbSource)) {
1612          * newref.setSource(dbSource); }
1613          */
1614         addDBRef(newref);
1615       }
1616     }
1617   }
1618
1619   /**
1620    * @return The index (zero-based) on this sequence in the MSA. It returns
1621    *         {@code -1} if this information is not available.
1622    */
1623   @Override
1624   public int getIndex()
1625   {
1626     return index;
1627   }
1628
1629   /**
1630    * Defines the position of this sequence in the MSA. Use the value {@code -1}
1631    * if this information is undefined.
1632    *
1633    * @param The
1634    *          position for this sequence. This value is zero-based (zero for
1635    *          this first sequence)
1636    */
1637   @Override
1638   public void setIndex(int value)
1639   {
1640     index = value;
1641   }
1642
1643   @Override
1644   public void setRNA(RNA r)
1645   {
1646     rna = r;
1647   }
1648
1649   @Override
1650   public RNA getRNA()
1651   {
1652     return rna;
1653   }
1654
1655   @Override
1656   public List<AlignmentAnnotation> getAlignmentAnnotations(String calcId,
1657           String label)
1658   {
1659     List<AlignmentAnnotation> result = new ArrayList<AlignmentAnnotation>();
1660     if (this.annotation != null)
1661     {
1662       for (AlignmentAnnotation ann : annotation)
1663       {
1664         if (ann.calcId != null && ann.calcId.equals(calcId)
1665                 && ann.label != null && ann.label.equals(label))
1666         {
1667           result.add(ann);
1668         }
1669       }
1670     }
1671     return result;
1672   }
1673
1674   @Override
1675   public String toString()
1676   {
1677     return getDisplayId(false);
1678   }
1679
1680   @Override
1681   public PDBEntry getPDBEntry(String pdbIdStr)
1682   {
1683     if (getDatasetSequence() != null)
1684     {
1685       return getDatasetSequence().getPDBEntry(pdbIdStr);
1686     }
1687     if (pdbIds == null)
1688     {
1689       return null;
1690     }
1691     List<PDBEntry> entries = getAllPDBEntries();
1692     for (PDBEntry entry : entries)
1693     {
1694       if (entry.getId().equalsIgnoreCase(pdbIdStr))
1695       {
1696         return entry;
1697       }
1698     }
1699     return null;
1700   }
1701
1702   @Override
1703   public List<DBRefEntry> getPrimaryDBRefs()
1704   {
1705     if (datasetSequence != null)
1706     {
1707       return datasetSequence.getPrimaryDBRefs();
1708     }
1709     if (dbrefs == null || dbrefs.length == 0)
1710     {
1711       return Collections.emptyList();
1712     }
1713     synchronized (dbrefs)
1714     {
1715       List<DBRefEntry> primaries = new ArrayList<DBRefEntry>();
1716       DBRefEntry[] tmp = new DBRefEntry[1];
1717       for (DBRefEntry ref : dbrefs)
1718       {
1719         if (!ref.isPrimaryCandidate())
1720         {
1721           continue;
1722         }
1723         if (ref.hasMap())
1724         {
1725           MapList mp = ref.getMap().getMap();
1726           if (mp.getFromLowest() > start || mp.getFromHighest() < end)
1727           {
1728             // map only involves a subsequence, so cannot be primary
1729             continue;
1730           }
1731         }
1732         // whilst it looks like it is a primary ref, we also sanity check type
1733         if (DBRefUtils.getCanonicalName(DBRefSource.PDB).equals(
1734                 DBRefUtils.getCanonicalName(ref.getSource())))
1735         {
1736           // PDB dbrefs imply there should be a PDBEntry associated
1737           // TODO: tighten PDB dbrefs
1738           // formally imply Jalview has actually downloaded and
1739           // parsed the pdb file. That means there should be a cached file
1740           // handle on the PDBEntry, and a real mapping between sequence and
1741           // extracted sequence from PDB file
1742           PDBEntry pdbentry = getPDBEntry(ref.getAccessionId());
1743           if (pdbentry != null && pdbentry.getFile() != null)
1744           {
1745             primaries.add(ref);
1746           }
1747           continue;
1748         }
1749         // check standard protein or dna sources
1750         tmp[0] = ref;
1751         DBRefEntry[] res = DBRefUtils.selectDbRefs(!isProtein(), tmp);
1752         if (res != null && res[0] == tmp[0])
1753         {
1754           primaries.add(ref);
1755           continue;
1756         }
1757       }
1758       return primaries;
1759     }
1760   }
1761
1762   /**
1763    * {@inheritDoc}
1764    */
1765   @Override
1766   public List<SequenceFeature> findFeatures(int fromColumn, int toColumn,
1767           String... types)
1768   {
1769     int startPos = findPosition(fromColumn - 1); // convert base 1 to base 0
1770     int endPos = findPosition(toColumn - 1);
1771     // to trace / debug behaviour:
1772     // System.out
1773     // .println(String
1774     // .format("%s.findFeatures columns [%d-%d] positions [%d-%d] leaves cursor %s",
1775     // getName(), fromColumn, toColumn, startPos,
1776     // endPos, cursor));
1777     List<SequenceFeature> result = new ArrayList<>();
1778     if (datasetSequence != null)
1779     {
1780       result = datasetSequence.getFeatures().findFeatures(startPos, endPos,
1781               types);
1782     }
1783     else
1784     {
1785       result = sequenceFeatureStore.findFeatures(startPos, endPos, types);
1786     }
1787
1788     /*
1789      * if the start or end column is gapped, startPos or endPos may be to the
1790      * left or right, and we may have included adjacent or enclosing features;
1791      * remove any that are not enclosing, non-contact features
1792      */
1793     if (endPos > this.end || Comparison.isGap(sequence[fromColumn - 1])
1794             || Comparison.isGap(sequence[toColumn - 1]))
1795     {
1796       ListIterator<SequenceFeature> it = result.listIterator();
1797       while (it.hasNext())
1798       {
1799         SequenceFeature sf = it.next();
1800         int featureStartColumn = findIndex(sf.getBegin());
1801         int featureEndColumn = findIndex(sf.getEnd());
1802         boolean noOverlap = featureStartColumn > toColumn
1803                         || featureEndColumn < fromColumn;
1804
1805         /*
1806          * reject an 'enclosing' feature if it is actually a contact feature
1807          */
1808         if (sf.isContactFeature() && featureStartColumn < fromColumn
1809                 && featureEndColumn > toColumn)
1810         {
1811           noOverlap = true;
1812         }
1813         if (noOverlap)
1814         {
1815           it.remove();
1816         }
1817       }
1818     }
1819
1820     return result;
1821   }
1822
1823   /**
1824    * Invalidates any stale cursors (forcing recalculation) by incrementing the
1825    * token that has to match the one presented by the cursor
1826    */
1827   @Override
1828   public void sequenceChanged()
1829   {
1830     changeCount++;
1831   }
1832
1833   /**
1834    * {@inheritDoc}
1835    */
1836   @Override
1837   public int replace(char c1, char c2)
1838   {
1839     if (c1 == c2)
1840     {
1841       return 0;
1842     }
1843     int count = 0;
1844     synchronized (sequence)
1845     {
1846       for (int c = 0; c < sequence.length; c++)
1847       {
1848         if (sequence[c] == c1)
1849         {
1850           sequence[c] = c2;
1851           count++;
1852         }
1853       }
1854     }
1855     if (count > 0)
1856     {
1857       sequenceChanged();
1858     }
1859
1860     return count;
1861   }
1862 }