src/jalview/datamodel/Sequence.java

   1 /*
   2  * Jalview - A Sequence Alignment Editor and Viewer ($$Version-Rel$$)
   3  * Copyright (C) $$Year-Rel$$ The Jalview Authors
   4  *
   5  * This file is part of Jalview.
   6  *
   7  * Jalview is free software: you can redistribute it and/or
   8  * modify it under the terms of the GNU General Public License
   9  * as published by the Free Software Foundation, either version 3
  10  * of the License, or (at your option) any later version.
  11  *
  12  * Jalview is distributed in the hope that it will be useful, but
  13  * WITHOUT ANY WARRANTY; without even the implied warranty
  14  * of MERCHANTABILITY or FITNESS FOR A PARTICULAR
  15  * PURPOSE.  See the GNU General Public License for more details.
  16  *
  17  * You should have received a copy of the GNU General Public License
  18  * along with Jalview.  If not, see <http://www.gnu.org/licenses/>.
  19  * The Jalview Authors are detailed in the 'AUTHORS' file.
  20  */
  21 package jalview.datamodel;
  22
  23 import jalview.analysis.AlignSeq;
  24 import jalview.api.DBRefEntryI;
  25 import jalview.datamodel.features.SequenceFeatures;
  26 import jalview.datamodel.features.SequenceFeaturesI;
  27 import jalview.util.Comparison;
  28 import jalview.util.DBRefUtils;
  29 import jalview.util.MapList;
  30 import jalview.util.StringUtils;
  31
  32 import java.util.ArrayList;
  33 import java.util.Arrays;
  34 import java.util.BitSet;
  35 import java.util.Collections;
  36 import java.util.Enumeration;
  37 import java.util.List;
  38 import java.util.ListIterator;
  39 import java.util.Vector;
  40
  41 import com.stevesoft.pat.Regex;
  42
  43 import fr.orsay.lri.varna.models.rna.RNA;
  44
  45 /**
  46  *
  47  * Implements the SequenceI interface for a char[] based sequence object
  48  */
  49 public class Sequence extends ASequence implements SequenceI
  50 {
  51   private static final Regex limitrx = new Regex(
  52           "[/][0-9]{1,}[-][0-9]{1,}$");
  53
  54   private static final Regex endrx = new Regex("[0-9]{1,}$");
  55
  56   SequenceI datasetSequence;
  57
  58   String name;
  59
  60   private char[] sequence;
  61
  62   String description;
  63
  64   int start;
  65
  66   int end;
  67
  68   Vector<PDBEntry> pdbIds;
  69
  70   String vamsasId;
  71
  72   DBRefEntry[] dbrefs;
  73
  74   RNA rna;
  75
  76   /**
  77    * This annotation is displayed below the alignment but the positions are tied
  78    * to the residues of this sequence
  79    *
  80    * TODO: change to List<>
  81    */
  82   Vector<AlignmentAnnotation> annotation;
  83
  84   /**
  85    * The index of the sequence in a MSA
  86    */
  87   int index = -1;
  88
  89   private SequenceFeatures sequenceFeatureStore;
  90
  91   /*
  92    * A cursor holding the approximate current view position to the sequence,
  93    * as determined by findIndex or findPosition or findPositions.
  94    * Using a cursor as a hint allows these methods to be more performant for
  95    * large sequences.
  96    */
  97   private SequenceCursor cursor;
  98
  99   /*
 100    * A number that should be incremented whenever the sequence is edited.
 101    * If the value matches the cursor token, then we can trust the cursor,
 102    * if not then it should be recomputed.
 103    */
 104   private int changeCount;
 105
 106   /**
 107    * Creates a new Sequence object.
 108    *
 109    * @param name
 110    *          display name string
 111    * @param sequence
 112    *          string to form a possibly gapped sequence out of
 113    * @param start
 114    *          first position of non-gap residue in the sequence
 115    * @param end
 116    *          last position of ungapped residues (nearly always only used for
 117    *          display purposes)
 118    */
 119   public Sequence(String name, String sequence, int start, int end)
 120   {
 121     this();
 122     initSeqAndName(name, sequence.toCharArray(), start, end);
 123   }
 124
 125   public Sequence(String name, char[] sequence, int start, int end)
 126   {
 127     this();
 128     initSeqAndName(name, sequence, start, end);
 129   }
 130
 131   /**
 132    * Stage 1 constructor - assign name, sequence, and set start and end fields.
 133    * start and end are updated values from name2 if it ends with /start-end
 134    *
 135    * @param name2
 136    * @param sequence2
 137    * @param start2
 138    * @param end2
 139    */
 140   protected void initSeqAndName(String name2, char[] sequence2, int start2,
 141           int end2)
 142   {
 143     this.name = name2;
 144     this.sequence = sequence2;
 145     this.start = start2;
 146     this.end = end2;
 147     parseId();
 148     checkValidRange();
 149   }
 150
 151   void parseId()
 152   {
 153     if (name == null)
 154     {
 155       System.err
 156               .println("POSSIBLE IMPLEMENTATION ERROR: null sequence name passed to constructor.");
 157       name = "";
 158     }
 159     // Does sequence have the /start-end signature?
 160     if (limitrx.search(name))
 161     {
 162       name = limitrx.left();
 163       endrx.search(limitrx.stringMatched());
 164       setStart(Integer.parseInt(limitrx.stringMatched().substring(1,
 165               endrx.matchedFrom() - 1)));
 166       setEnd(Integer.parseInt(endrx.stringMatched()));
 167     }
 168   }
 169
 170   void checkValidRange()
 171   {
 172     // Note: JAL-774 :
 173     // http://issues.jalview.org/browse/JAL-774?focusedCommentId=11239&page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel#comment-11239
 174     {
 175       int endRes = 0;
 176       for (int j = 0; j < sequence.length; j++)
 177       {
 178         if (!jalview.util.Comparison.isGap(sequence[j]))
 179         {
 180           endRes++;
 181         }
 182       }
 183       if (endRes > 0)
 184       {
 185         endRes += start - 1;
 186       }
 187
 188       if (end < endRes)
 189       {
 190         end = endRes;
 191       }
 192     }
 193
 194   }
 195
 196   /**
 197    * default constructor
 198    */
 199   private Sequence()
 200   {
 201     sequenceFeatureStore = new SequenceFeatures();
 202   }
 203
 204   /**
 205    * Creates a new Sequence object.
 206    *
 207    * @param name
 208    *          DOCUMENT ME!
 209    * @param sequence
 210    *          DOCUMENT ME!
 211    */
 212   public Sequence(String name, String sequence)
 213   {
 214     this(name, sequence, 1, -1);
 215   }
 216
 217   /**
 218    * Creates a new Sequence object with new AlignmentAnnotations but inherits
 219    * any existing dataset sequence reference. If non exists, everything is
 220    * copied.
 221    *
 222    * @param seq
 223    *          if seq is a dataset sequence, behaves like a plain old copy
 224    *          constructor
 225    */
 226   public Sequence(SequenceI seq)
 227   {
 228     this(seq, seq.getAnnotation());
 229   }
 230
 231   /**
 232    * Create a new sequence object with new features, DBRefEntries, and PDBIds
 233    * but inherits any existing dataset sequence reference, and duplicate of any
 234    * annotation that is present in the given annotation array.
 235    *
 236    * @param seq
 237    *          the sequence to be copied
 238    * @param alAnnotation
 239    *          an array of annotation including some associated with seq
 240    */
 241   public Sequence(SequenceI seq, AlignmentAnnotation[] alAnnotation)
 242   {
 243     this();
 244     initSeqFrom(seq, alAnnotation);
 245   }
 246
 247   /**
 248    * does the heavy lifting when cloning a dataset sequence, or coping data from
 249    * dataset to a new derived sequence.
 250    *
 251    * @param seq
 252    *          - source of attributes.
 253    * @param alAnnotation
 254    *          - alignment annotation present on seq that should be copied onto
 255    *          this sequence
 256    */
 257   protected void initSeqFrom(SequenceI seq,
 258           AlignmentAnnotation[] alAnnotation)
 259   {
 260     char[] oseq = seq.getSequence(); // returns a copy of the array
 261     initSeqAndName(seq.getName(), oseq, seq.getStart(), seq.getEnd());
 262
 263     description = seq.getDescription();
 264     if (seq != datasetSequence)
 265     {
 266       setDatasetSequence(seq.getDatasetSequence());
 267     }
 268
 269     /*
 270      * only copy DBRefs and seqfeatures if we really are a dataset sequence
 271      */
 272     if (datasetSequence == null)
 273     {
 274       if (seq.getDBRefs() != null)
 275       {
 276         DBRefEntry[] dbr = seq.getDBRefs();
 277         for (int i = 0; i < dbr.length; i++)
 278         {
 279           addDBRef(new DBRefEntry(dbr[i]));
 280         }
 281       }
 282
 283       /*
 284        * make copies of any sequence features
 285        */
 286       for (SequenceFeature sf : seq.getSequenceFeatures())
 287       {
 288         addSequenceFeature(new SequenceFeature(sf));
 289       }
 290     }
 291
 292     if (seq.getAnnotation() != null)
 293     {
 294       AlignmentAnnotation[] sqann = seq.getAnnotation();
 295       for (int i = 0; i < sqann.length; i++)
 296       {
 297         if (sqann[i] == null)
 298         {
 299           continue;
 300         }
 301         boolean found = (alAnnotation == null);
 302         if (!found)
 303         {
 304           for (int apos = 0; !found && apos < alAnnotation.length; apos++)
 305           {
 306             found = (alAnnotation[apos] == sqann[i]);
 307           }
 308         }
 309         if (found)
 310         {
 311           // only copy the given annotation
 312           AlignmentAnnotation newann = new AlignmentAnnotation(sqann[i]);
 313           addAlignmentAnnotation(newann);
 314         }
 315       }
 316     }
 317     if (seq.getAllPDBEntries() != null)
 318     {
 319       Vector<PDBEntry> ids = seq.getAllPDBEntries();
 320       for (PDBEntry pdb : ids)
 321       {
 322         this.addPDBId(new PDBEntry(pdb));
 323       }
 324     }
 325   }
 326
 327   @Override
 328   public void setSequenceFeatures(List<SequenceFeature> features)
 329   {
 330     if (datasetSequence != null)
 331     {
 332       datasetSequence.setSequenceFeatures(features);
 333       return;
 334     }
 335     sequenceFeatureStore = new SequenceFeatures(features);
 336   }
 337
 338   @Override
 339   public synchronized boolean addSequenceFeature(SequenceFeature sf)
 340   {
 341     if (sf.getType() == null)
 342     {
 343       System.err.println("SequenceFeature type may not be null: "
 344               + sf.toString());
 345       return false;
 346     }
 347
 348     if (datasetSequence != null)
 349     {
 350       return datasetSequence.addSequenceFeature(sf);
 351     }
 352
 353     return sequenceFeatureStore.add(sf);
 354   }
 355
 356   @Override
 357   public void deleteFeature(SequenceFeature sf)
 358   {
 359     if (datasetSequence != null)
 360     {
 361       datasetSequence.deleteFeature(sf);
 362     }
 363     else
 364     {
 365       sequenceFeatureStore.delete(sf);
 366     }
 367   }
 368
 369   /**
 370    * {@inheritDoc}
 371    *
 372    * @return
 373    */
 374   @Override
 375   public List<SequenceFeature> getSequenceFeatures()
 376   {
 377     if (datasetSequence != null)
 378     {
 379       return datasetSequence.getSequenceFeatures();
 380     }
 381     return sequenceFeatureStore.getAllFeatures();
 382   }
 383
 384   @Override
 385   public SequenceFeaturesI getFeatures()
 386   {
 387     return datasetSequence != null ? datasetSequence.getFeatures()
 388             : sequenceFeatureStore;
 389   }
 390
 391   @Override
 392   public boolean addPDBId(PDBEntry entry)
 393   {
 394     if (pdbIds == null)
 395     {
 396       pdbIds = new Vector<PDBEntry>();
 397       pdbIds.add(entry);
 398       return true;
 399     }
 400
 401     for (PDBEntry pdbe : pdbIds)
 402     {
 403       if (pdbe.updateFrom(entry))
 404       {
 405         return false;
 406       }
 407     }
 408     pdbIds.addElement(entry);
 409     return true;
 410   }
 411
 412   /**
 413    * DOCUMENT ME!
 414    *
 415    * @param id
 416    *          DOCUMENT ME!
 417    */
 418   @Override
 419   public void setPDBId(Vector<PDBEntry> id)
 420   {
 421     pdbIds = id;
 422   }
 423
 424   /**
 425    * DOCUMENT ME!
 426    *
 427    * @return DOCUMENT ME!
 428    */
 429   @Override
 430   public Vector<PDBEntry> getAllPDBEntries()
 431   {
 432     return pdbIds == null ? new Vector<PDBEntry>() : pdbIds;
 433   }
 434
 435   /**
 436    * DOCUMENT ME!
 437    *
 438    * @return DOCUMENT ME!
 439    */
 440   @Override
 441   public String getDisplayId(boolean jvsuffix)
 442   {
 443     StringBuffer result = new StringBuffer(name);
 444     if (jvsuffix)
 445     {
 446       result.append("/" + start + "-" + end);
 447     }
 448
 449     return result.toString();
 450   }
 451
 452   /**
 453    * DOCUMENT ME!
 454    *
 455    * @param name
 456    *          DOCUMENT ME!
 457    */
 458   @Override
 459   public void setName(String name)
 460   {
 461     this.name = name;
 462     this.parseId();
 463   }
 464
 465   /**
 466    * DOCUMENT ME!
 467    *
 468    * @return DOCUMENT ME!
 469    */
 470   @Override
 471   public String getName()
 472   {
 473     return this.name;
 474   }
 475
 476   /**
 477    * DOCUMENT ME!
 478    *
 479    * @param start
 480    *          DOCUMENT ME!
 481    */
 482   @Override
 483   public void setStart(int start)
 484   {
 485     this.start = start;
 486   }
 487
 488   /**
 489    * DOCUMENT ME!
 490    *
 491    * @return DOCUMENT ME!
 492    */
 493   @Override
 494   public int getStart()
 495   {
 496     return this.start;
 497   }
 498
 499   /**
 500    * DOCUMENT ME!
 501    *
 502    * @param end
 503    *          DOCUMENT ME!
 504    */
 505   @Override
 506   public void setEnd(int end)
 507   {
 508     this.end = end;
 509   }
 510
 511   /**
 512    * DOCUMENT ME!
 513    *
 514    * @return DOCUMENT ME!
 515    */
 516   @Override
 517   public int getEnd()
 518   {
 519     return this.end;
 520   }
 521
 522   /**
 523    * DOCUMENT ME!
 524    *
 525    * @return DOCUMENT ME!
 526    */
 527   @Override
 528   public int getLength()
 529   {
 530     return this.sequence.length;
 531   }
 532
 533   /**
 534    * DOCUMENT ME!
 535    *
 536    * @param seq
 537    *          DOCUMENT ME!
 538    */
 539   @Override
 540   public void setSequence(String seq)
 541   {
 542     this.sequence = seq.toCharArray();
 543     checkValidRange();
 544     sequenceChanged();
 545   }
 546
 547   @Override
 548   public String getSequenceAsString()
 549   {
 550     return new String(sequence);
 551   }
 552
 553   @Override
 554   public String getSequenceAsString(int start, int end)
 555   {
 556     return new String(getSequence(start, end));
 557   }
 558
 559   @Override
 560   public char[] getSequence()
 561   {
 562     // return sequence;
 563     return sequence == null ? null : Arrays.copyOf(sequence,
 564             sequence.length);
 565   }
 566
 567   /*
 568    * (non-Javadoc)
 569    *
 570    * @see jalview.datamodel.SequenceI#getSequence(int, int)
 571    */
 572   @Override
 573   public char[] getSequence(int start, int end)
 574   {
 575     if (start < 0)
 576     {
 577       start = 0;
 578     }
 579     // JBPNote - left to user to pad the result here (TODO:Decide on this
 580     // policy)
 581     if (start >= sequence.length)
 582     {
 583       return new char[0];
 584     }
 585
 586     if (end >= sequence.length)
 587     {
 588       end = sequence.length;
 589     }
 590
 591     char[] reply = new char[end - start];
 592     System.arraycopy(sequence, start, reply, 0, end - start);
 593
 594     return reply;
 595   }
 596
 597   @Override
 598   public SequenceI getSubSequence(int start, int end)
 599   {
 600     if (start < 0)
 601     {
 602       start = 0;
 603     }
 604     char[] seq = getSequence(start, end);
 605     if (seq.length == 0)
 606     {
 607       return null;
 608     }
 609     int nstart = findPosition(start);
 610     int nend = findPosition(end) - 1;
 611     // JBPNote - this is an incomplete copy.
 612     SequenceI nseq = new Sequence(this.getName(), seq, nstart, nend);
 613     nseq.setDescription(description);
 614     if (datasetSequence != null)
 615     {
 616       nseq.setDatasetSequence(datasetSequence);
 617     }
 618     else
 619     {
 620       nseq.setDatasetSequence(this);
 621     }
 622     return nseq;
 623   }
 624
 625   /**
 626    * Returns the character of the aligned sequence at the given position (base
 627    * zero), or space if the position is not within the sequence's bounds
 628    *
 629    * @return
 630    */
 631   @Override
 632   public char getCharAt(int i)
 633   {
 634     if (i >= 0 && i < sequence.length)
 635     {
 636       return sequence[i];
 637     }
 638     else
 639     {
 640       return ' ';
 641     }
 642   }
 643
 644   /**
 645    * DOCUMENT ME!
 646    *
 647    * @param desc
 648    *          DOCUMENT ME!
 649    */
 650   @Override
 651   public void setDescription(String desc)
 652   {
 653     this.description = desc;
 654   }
 655
 656   /**
 657    * DOCUMENT ME!
 658    *
 659    * @return DOCUMENT ME!
 660    */
 661   @Override
 662   public String getDescription()
 663   {
 664     return this.description;
 665   }
 666
 667   /**
 668    * {@inheritDoc}
 669    */
 670   @Override
 671   public int findIndex(int pos)
 672   {
 673     /*
 674      * use a valid, hopefully nearby, cursor if available
 675      */
 676     if (isValidCursor(cursor))
 677     {
 678       return findIndex(pos, cursor);
 679     }
 680
 681     int j = start;
 682     int i = 0;
 683     int startColumn = 0;
 684
 685     /*
 686      * traverse sequence from the start counting gaps; make a note of
 687      * the column of the first residue to save in the cursor
 688      */
 689     while ((i < sequence.length) && (j <= end) && (j <= pos))
 690     {
 691       if (!Comparison.isGap(sequence[i]))
 692       {
 693         if (j == start)
 694         {
 695           startColumn = i;
 696         }
 697         j++;
 698       }
 699       i++;
 700     }
 701
 702     if (j == end && j < pos)
 703     {
 704       return end + 1;
 705     }
 706
 707     updateCursor(pos, i, startColumn);
 708     return i;
 709   }
 710
 711   /**
 712    * Updates the cursor to the latest found residue and column position
 713    *
 714    * @param residuePos
 715    *          (start..)
 716    * @param column
 717    *          (1..)
 718    * @param startColumn
 719    *          column position of the first sequence residue
 720    */
 721   protected void updateCursor(int residuePos, int column, int startColumn)
 722   {
 723     int endColumn = cursor == null ? 0 : cursor.lastResidueColumn;
 724     if (residuePos == this.end)
 725     {
 726       endColumn = column;
 727     }
 728
 729     cursor = new SequenceCursor(this, residuePos, column, startColumn,
 730             endColumn, this.changeCount);
 731   }
 732
 733   /**
 734    * Answers the aligned column position (1..) for the given residue position
 735    * (start..) given a 'hint' of a residue/column location in the neighbourhood.
 736    * The hint may be left of, at, or to the right of the required position.
 737    *
 738    * @param pos
 739    * @param curs
 740    * @return
 741    */
 742   protected int findIndex(int pos, SequenceCursor curs)
 743   {
 744     if (!isValidCursor(curs))
 745     {
 746       /*
 747        * wrong or invalidated cursor, compute de novo
 748        */
 749       return findIndex(pos);
 750     }
 751
 752     if (curs.residuePosition == pos)
 753     {
 754       return curs.columnPosition;
 755     }
 756
 757     /*
 758      * move left or right to find pos from hint.position
 759      */
 760     int col = curs.columnPosition - 1; // convert from base 1 to base 0
 761     int newPos = curs.residuePosition;
 762     int delta = newPos > pos ? -1 : 1;
 763
 764     while (newPos != pos)
 765     {
 766       col += delta; // shift one column left or right
 767       if (col < 0 || col == sequence.length)
 768       {
 769         break;
 770       }
 771       if (!Comparison.isGap(sequence[col]))
 772       {
 773         newPos += delta;
 774       }
 775     }
 776
 777     col++; // convert back to base 1
 778     updateCursor(pos, col, curs.firstResidueColumn);
 779
 780     return col;
 781   }
 782
 783   /**
 784    * {@inheritDoc}
 785    */
 786   @Override
 787   public Range findPositions(int fromColumn, int toColumn)
 788   {
 789     if (toColumn < fromColumn || fromColumn < 1)
 790     {
 791       return null;
 792     }
 793
 794     /*
 795      * find the first non-gapped position, if any
 796      */
 797     int firstPosition = 0;
 798     int col = fromColumn - 1;
 799     int length = sequence.length;
 800     while (col < length && col < toColumn)
 801     {
 802       if (!Comparison.isGap(sequence[col]))
 803       {
 804         firstPosition = findPosition(col++);
 805         break;
 806       }
 807       col++;
 808     }
 809
 810     if (firstPosition == 0)
 811     {
 812       return null;
 813     }
 814
 815     /*
 816      * find the last non-gapped position
 817      */
 818     int lastPosition = firstPosition;
 819     while (col < length && col < toColumn)
 820     {
 821       if (!Comparison.isGap(sequence[col++]))
 822       {
 823         lastPosition++;
 824       }
 825     }
 826
 827     return new Range(firstPosition, lastPosition);
 828   }
 829
 830   /**
 831    * {@inheritDoc}
 832    */
 833   @Override
 834   public int findPosition(final int column)
 835   {
 836     /*
 837      * use a valid, hopefully nearby, cursor if available
 838      */
 839     if (isValidCursor(cursor))
 840     {
 841       return findPosition(column + 1, cursor);
 842     }
 843
 844     // TODO recode this more naturally i.e. count residues only
 845     // as they are found, not 'in anticipation'
 846
 847     /*
 848      * traverse the sequence counting gaps; note the column position
 849      * of the first residue, to save in the cursor
 850      */
 851     int firstResidueColumn = 0;
 852     int lastPosFound = 0;
 853     int lastPosFoundColumn = 0;
 854     int seqlen = sequence.length;
 855
 856     if (seqlen > 0 && !Comparison.isGap(sequence[0]))
 857     {
 858       lastPosFound = start;
 859       lastPosFoundColumn = 0;
 860     }
 861
 862     int j = 0;
 863     int pos = start;
 864
 865     while (j < column && j < seqlen)
 866     {
 867       if (!Comparison.isGap(sequence[j]))
 868       {
 869         lastPosFound = pos;
 870         lastPosFoundColumn = j;
 871         if (pos == this.start)
 872         {
 873           firstResidueColumn = j;
 874         }
 875         pos++;
 876       }
 877       j++;
 878     }
 879     if (j < seqlen && !Comparison.isGap(sequence[j]))
 880     {
 881       lastPosFound = pos;
 882       lastPosFoundColumn = j;
 883       if (pos == this.start)
 884       {
 885         firstResidueColumn = j;
 886       }
 887     }
 888
 889     /*
 890      * update the cursor to the last residue position found (if any)
 891      * (converting column position to base 1)
 892      */
 893     if (lastPosFound != 0)
 894     {
 895       updateCursor(lastPosFound, lastPosFoundColumn + 1,
 896               firstResidueColumn + 1);
 897     }
 898
 899     return pos;
 900   }
 901
 902   /**
 903    * Answers true if the given cursor is not null, is for this sequence object,
 904    * and has a token value that matches this object's changeCount, else false.
 905    * This allows us to ignore a cursor as 'stale' if the sequence has been
 906    * modified since the cursor was created.
 907    *
 908    * @param curs
 909    * @return
 910    */
 911   protected boolean isValidCursor(SequenceCursor curs)
 912   {
 913     if (curs == null || curs.sequence != this || curs.token != changeCount)
 914     {
 915       return false;
 916     }
 917     /*
 918      * sanity check against range
 919      */
 920     if (curs.columnPosition < 0 || curs.columnPosition > sequence.length)
 921     {
 922       return false;
 923     }
 924     if (curs.residuePosition < start || curs.residuePosition > end)
 925     {
 926       return false;
 927     }
 928     return true;
 929   }
 930
 931   /**
 932    * Answers the sequence position (start..) for the given aligned column
 933    * position (1..), given a hint of a cursor in the neighbourhood. The cursor
 934    * may lie left of, at, or to the right of the column position.
 935    *
 936    * @param col
 937    * @param curs
 938    * @return
 939    */
 940   protected int findPosition(final int col, SequenceCursor curs)
 941   {
 942     if (!isValidCursor(curs))
 943     {
 944       /*
 945        * wrong or invalidated cursor, compute de novo
 946        */
 947       return findPosition(col - 1);// ugh back to base 0
 948     }
 949
 950     if (curs.columnPosition == col)
 951     {
 952       cursor = curs; // in case this method becomes public
 953       return curs.residuePosition; // easy case :-)
 954     }
 955
 956     if (curs.lastResidueColumn > 0 && curs.lastResidueColumn < col)
 957     {
 958       /*
 959        * sequence lies entirely to the left of col
 960        * - return last residue + 1
 961        */
 962       return end + 1;
 963     }
 964
 965     if (curs.firstResidueColumn > 0 && curs.firstResidueColumn > col)
 966     {
 967       /*
 968        * sequence lies entirely to the right of col
 969        * - return first residue
 970        */
 971       return start;
 972     }
 973
 974     // todo could choose closest to col out of column,
 975     // firstColumnPosition, lastColumnPosition as a start point
 976
 977     /*
 978      * move left or right to find pos from cursor position
 979      */
 980     int firstResidueColumn = curs.firstResidueColumn;
 981     int column = curs.columnPosition - 1; // to base 0
 982     int newPos = curs.residuePosition;
 983     int delta = curs.columnPosition > col ? -1 : 1;
 984     boolean gapped = false;
 985     int lastFoundPosition = curs.residuePosition;
 986     int lastFoundPositionColumn = curs.columnPosition;
 987
 988     while (column != col - 1)
 989     {
 990       column += delta; // shift one column left or right
 991       if (column < 0 || column == sequence.length)
 992       {
 993         break;
 994       }
 995       gapped = Comparison.isGap(sequence[column]);
 996       if (!gapped)
 997       {
 998         newPos += delta;
 999         lastFoundPosition = newPos;
1000         lastFoundPositionColumn = column + 1;
1001         if (lastFoundPosition == this.start)
1002         {
1003           firstResidueColumn = column + 1;
1004         }
1005       }
1006     }
1007
1008     if (cursor == null || lastFoundPosition != cursor.residuePosition)
1009     {
1010       updateCursor(lastFoundPosition, lastFoundPositionColumn,
1011               firstResidueColumn);
1012     }
1013
1014     /*
1015      * hack to give position to the right if on a gap
1016      * or beyond the length of the sequence (see JAL-2562)
1017      */
1018     if (delta > 0 && (gapped || column >= sequence.length))
1019     {
1020       newPos++;
1021     }
1022
1023     return newPos;
1024   }
1025
1026   /**
1027    * Returns an int array where indices correspond to each residue in the
1028    * sequence and the element value gives its position in the alignment
1029    *
1030    * @return int[SequenceI.getEnd()-SequenceI.getStart()+1] or null if no
1031    *         residues in SequenceI object
1032    */
1033   @Override
1034   public int[] gapMap()
1035   {
1036     String seq = jalview.analysis.AlignSeq.extractGaps(
1037             jalview.util.Comparison.GapChars, new String(sequence));
1038     int[] map = new int[seq.length()];
1039     int j = 0;
1040     int p = 0;
1041
1042     while (j < sequence.length)
1043     {
1044       if (!jalview.util.Comparison.isGap(sequence[j]))
1045       {
1046         map[p++] = j;
1047       }
1048
1049       j++;
1050     }
1051
1052     return map;
1053   }
1054
1055   @Override
1056   public int[] findPositionMap()
1057   {
1058     int map[] = new int[sequence.length];
1059     int j = 0;
1060     int pos = start;
1061     int seqlen = sequence.length;
1062     while ((j < seqlen))
1063     {
1064       map[j] = pos;
1065       if (!jalview.util.Comparison.isGap(sequence[j]))
1066       {
1067         pos++;
1068       }
1069
1070       j++;
1071     }
1072     return map;
1073   }
1074
1075   @Override
1076   public List<int[]> getInsertions()
1077   {
1078     ArrayList<int[]> map = new ArrayList<int[]>();
1079     int lastj = -1, j = 0;
1080     int pos = start;
1081     int seqlen = sequence.length;
1082     while ((j < seqlen))
1083     {
1084       if (jalview.util.Comparison.isGap(sequence[j]))
1085       {
1086         if (lastj == -1)
1087         {
1088           lastj = j;
1089         }
1090       }
1091       else
1092       {
1093         if (lastj != -1)
1094         {
1095           map.add(new int[] { lastj, j - 1 });
1096           lastj = -1;
1097         }
1098       }
1099       j++;
1100     }
1101     if (lastj != -1)
1102     {
1103       map.add(new int[] { lastj, j - 1 });
1104       lastj = -1;
1105     }
1106     return map;
1107   }
1108
1109   @Override
1110   public BitSet getInsertionsAsBits()
1111   {
1112     BitSet map = new BitSet();
1113     int lastj = -1, j = 0;
1114     int pos = start;
1115     int seqlen = sequence.length;
1116     while ((j < seqlen))
1117     {
1118       if (jalview.util.Comparison.isGap(sequence[j]))
1119       {
1120         if (lastj == -1)
1121         {
1122           lastj = j;
1123         }
1124       }
1125       else
1126       {
1127         if (lastj != -1)
1128         {
1129           map.set(lastj, j);
1130           lastj = -1;
1131         }
1132       }
1133       j++;
1134     }
1135     if (lastj != -1)
1136     {
1137       map.set(lastj, j);
1138       lastj = -1;
1139     }
1140     return map;
1141   }
1142
1143   @Override
1144   public void deleteChars(int i, int j)
1145   {
1146     int newstart = start, newend = end;
1147     if (i >= sequence.length || i < 0)
1148     {
1149       return;
1150     }
1151
1152     char[] tmp = StringUtils.deleteChars(sequence, i, j);
1153     boolean createNewDs = false;
1154     // TODO: take a (second look) at the dataset creation validation method for
1155     // the very large sequence case
1156     int eindex = -1, sindex = -1;
1157     boolean ecalc = false, scalc = false;
1158     for (int s = i; s < j; s++)
1159     {
1160       if (jalview.schemes.ResidueProperties.aaIndex[sequence[s]] != 23)
1161       {
1162         if (createNewDs)
1163         {
1164           newend--;
1165         }
1166         else
1167         {
1168           if (!scalc)
1169           {
1170             sindex = findIndex(start) - 1;
1171             scalc = true;
1172           }
1173           if (sindex == s)
1174           {
1175             // delete characters including start of sequence
1176             newstart = findPosition(j);
1177             break; // don't need to search for any more residue characters.
1178           }
1179           else
1180           {
1181             // delete characters after start.
1182             if (!ecalc)
1183             {
1184               eindex = findIndex(end) - 1;
1185               ecalc = true;
1186             }
1187             if (eindex < j)
1188             {
1189               // delete characters at end of sequence
1190               newend = findPosition(i - 1);
1191               break; // don't need to search for any more residue characters.
1192             }
1193             else
1194             {
1195               createNewDs = true;
1196               newend--; // decrease end position by one for the deleted residue
1197               // and search further
1198             }
1199           }
1200         }
1201       }
1202     }
1203     // deletion occured in the middle of the sequence
1204     if (createNewDs && this.datasetSequence != null)
1205     {
1206       // construct a new sequence
1207       Sequence ds = new Sequence(datasetSequence);
1208       // TODO: remove any non-inheritable properties ?
1209       // TODO: create a sequence mapping (since there is a relation here ?)
1210       ds.deleteChars(i, j);
1211       datasetSequence = ds;
1212     }
1213     start = newstart;
1214     end = newend;
1215     sequence = tmp;
1216     sequenceChanged();
1217   }
1218
1219   @Override
1220   public void insertCharAt(int i, int length, char c)
1221   {
1222     char[] tmp = new char[sequence.length + length];
1223
1224     if (i >= sequence.length)
1225     {
1226       System.arraycopy(sequence, 0, tmp, 0, sequence.length);
1227       i = sequence.length;
1228     }
1229     else
1230     {
1231       System.arraycopy(sequence, 0, tmp, 0, i);
1232     }
1233
1234     int index = i;
1235     while (length > 0)
1236     {
1237       tmp[index++] = c;
1238       length--;
1239     }
1240
1241     if (i < sequence.length)
1242     {
1243       System.arraycopy(sequence, i, tmp, index, sequence.length - i);
1244     }
1245
1246     sequence = tmp;
1247     sequenceChanged();
1248   }
1249
1250   @Override
1251   public void insertCharAt(int i, char c)
1252   {
1253     insertCharAt(i, 1, c);
1254   }
1255
1256   @Override
1257   public String getVamsasId()
1258   {
1259     return vamsasId;
1260   }
1261
1262   @Override
1263   public void setVamsasId(String id)
1264   {
1265     vamsasId = id;
1266   }
1267
1268   @Override
1269   public void setDBRefs(DBRefEntry[] dbref)
1270   {
1271     if (dbrefs == null && datasetSequence != null
1272             && this != datasetSequence)
1273     {
1274       datasetSequence.setDBRefs(dbref);
1275       return;
1276     }
1277     dbrefs = dbref;
1278     if (dbrefs != null)
1279     {
1280       DBRefUtils.ensurePrimaries(this);
1281     }
1282   }
1283
1284   @Override
1285   public DBRefEntry[] getDBRefs()
1286   {
1287     if (dbrefs == null && datasetSequence != null
1288             && this != datasetSequence)
1289     {
1290       return datasetSequence.getDBRefs();
1291     }
1292     return dbrefs;
1293   }
1294
1295   @Override
1296   public void addDBRef(DBRefEntry entry)
1297   {
1298     if (datasetSequence != null)
1299     {
1300       datasetSequence.addDBRef(entry);
1301       return;
1302     }
1303
1304     if (dbrefs == null)
1305     {
1306       dbrefs = new DBRefEntry[0];
1307     }
1308
1309     for (DBRefEntryI dbr : dbrefs)
1310     {
1311       if (dbr.updateFrom(entry))
1312       {
1313         /*
1314          * found a dbref that either matched, or could be
1315          * updated from, the new entry - no need to add it
1316          */
1317         return;
1318       }
1319     }
1320
1321     /*
1322      * extend the array to make room for one more
1323      */
1324     // TODO use an ArrayList instead
1325     int j = dbrefs.length;
1326     DBRefEntry[] temp = new DBRefEntry[j + 1];
1327     System.arraycopy(dbrefs, 0, temp, 0, j);
1328     temp[temp.length - 1] = entry;
1329
1330     dbrefs = temp;
1331
1332     DBRefUtils.ensurePrimaries(this);
1333   }
1334
1335   @Override
1336   public void setDatasetSequence(SequenceI seq)
1337   {
1338     if (seq == this)
1339     {
1340       throw new IllegalArgumentException(
1341               "Implementation Error: self reference passed to SequenceI.setDatasetSequence");
1342     }
1343     if (seq != null && seq.getDatasetSequence() != null)
1344     {
1345       throw new IllegalArgumentException(
1346               "Implementation error: cascading dataset sequences are not allowed.");
1347     }
1348     datasetSequence = seq;
1349   }
1350
1351   @Override
1352   public SequenceI getDatasetSequence()
1353   {
1354     return datasetSequence;
1355   }
1356
1357   @Override
1358   public AlignmentAnnotation[] getAnnotation()
1359   {
1360     return annotation == null ? null : annotation
1361             .toArray(new AlignmentAnnotation[annotation.size()]);
1362   }
1363
1364   @Override
1365   public boolean hasAnnotation(AlignmentAnnotation ann)
1366   {
1367     return annotation == null ? false : annotation.contains(ann);
1368   }
1369
1370   @Override
1371   public void addAlignmentAnnotation(AlignmentAnnotation annotation)
1372   {
1373     if (this.annotation == null)
1374     {
1375       this.annotation = new Vector<AlignmentAnnotation>();
1376     }
1377     if (!this.annotation.contains(annotation))
1378     {
1379       this.annotation.addElement(annotation);
1380     }
1381     annotation.setSequenceRef(this);
1382   }
1383
1384   @Override
1385   public void removeAlignmentAnnotation(AlignmentAnnotation annotation)
1386   {
1387     if (this.annotation != null)
1388     {
1389       this.annotation.removeElement(annotation);
1390       if (this.annotation.size() == 0)
1391       {
1392         this.annotation = null;
1393       }
1394     }
1395   }
1396
1397   /**
1398    * test if this is a valid candidate for another sequence's dataset sequence.
1399    *
1400    */
1401   private boolean isValidDatasetSequence()
1402   {
1403     if (datasetSequence != null)
1404     {
1405       return false;
1406     }
1407     for (int i = 0; i < sequence.length; i++)
1408     {
1409       if (jalview.util.Comparison.isGap(sequence[i]))
1410       {
1411         return false;
1412       }
1413     }
1414     return true;
1415   }
1416
1417   @Override
1418   public SequenceI deriveSequence()
1419   {
1420     Sequence seq = null;
1421     if (datasetSequence == null)
1422     {
1423       if (isValidDatasetSequence())
1424       {
1425         // Use this as dataset sequence
1426         seq = new Sequence(getName(), "", 1, -1);
1427         seq.setDatasetSequence(this);
1428         seq.initSeqFrom(this, getAnnotation());
1429         return seq;
1430       }
1431       else
1432       {
1433         // Create a new, valid dataset sequence
1434         createDatasetSequence();
1435       }
1436     }
1437     return new Sequence(this);
1438   }
1439
1440   private boolean _isNa;
1441
1442   private int _seqhash = 0;
1443
1444   /**
1445    * Answers false if the sequence is more than 85% nucleotide (ACGTU), else
1446    * true
1447    */
1448   @Override
1449   public boolean isProtein()
1450   {
1451     if (datasetSequence != null)
1452     {
1453       return datasetSequence.isProtein();
1454     }
1455     if (_seqhash != sequence.hashCode())
1456     {
1457       _seqhash = sequence.hashCode();
1458       _isNa = Comparison.isNucleotide(this);
1459     }
1460     return !_isNa;
1461   };
1462
1463   /*
1464    * (non-Javadoc)
1465    *
1466    * @see jalview.datamodel.SequenceI#createDatasetSequence()
1467    */
1468   @Override
1469   public SequenceI createDatasetSequence()
1470   {
1471     if (datasetSequence == null)
1472     {
1473       Sequence dsseq = new Sequence(getName(), AlignSeq.extractGaps(
1474               jalview.util.Comparison.GapChars, getSequenceAsString()),
1475               getStart(), getEnd());
1476
1477       datasetSequence = dsseq;
1478
1479       dsseq.setDescription(description);
1480       // move features and database references onto dataset sequence
1481       dsseq.sequenceFeatureStore = sequenceFeatureStore;
1482       sequenceFeatureStore = null;
1483       dsseq.dbrefs = dbrefs;
1484       dbrefs = null;
1485       // TODO: search and replace any references to this sequence with
1486       // references to the dataset sequence in Mappings on dbref
1487       dsseq.pdbIds = pdbIds;
1488       pdbIds = null;
1489       datasetSequence.updatePDBIds();
1490       if (annotation != null)
1491       {
1492         // annotation is cloned rather than moved, to preserve what's currently
1493         // on the alignment
1494         for (AlignmentAnnotation aa : annotation)
1495         {
1496           AlignmentAnnotation _aa = new AlignmentAnnotation(aa);
1497           _aa.sequenceRef = datasetSequence;
1498           _aa.adjustForAlignment(); // uses annotation's own record of
1499                                     // sequence-column mapping
1500           datasetSequence.addAlignmentAnnotation(_aa);
1501         }
1502       }
1503     }
1504     return datasetSequence;
1505   }
1506
1507   /*
1508    * (non-Javadoc)
1509    *
1510    * @see
1511    * jalview.datamodel.SequenceI#setAlignmentAnnotation(AlignmmentAnnotation[]
1512    * annotations)
1513    */
1514   @Override
1515   public void setAlignmentAnnotation(AlignmentAnnotation[] annotations)
1516   {
1517     if (annotation != null)
1518     {
1519       annotation.removeAllElements();
1520     }
1521     if (annotations != null)
1522     {
1523       for (int i = 0; i < annotations.length; i++)
1524       {
1525         if (annotations[i] != null)
1526         {
1527           addAlignmentAnnotation(annotations[i]);
1528         }
1529       }
1530     }
1531   }
1532
1533   @Override
1534   public AlignmentAnnotation[] getAnnotation(String label)
1535   {
1536     if (annotation == null || annotation.size() == 0)
1537     {
1538       return null;
1539     }
1540
1541     Vector<AlignmentAnnotation> subset = new Vector<AlignmentAnnotation>();
1542     Enumeration<AlignmentAnnotation> e = annotation.elements();
1543     while (e.hasMoreElements())
1544     {
1545       AlignmentAnnotation ann = e.nextElement();
1546       if (ann.label != null && ann.label.equals(label))
1547       {
1548         subset.addElement(ann);
1549       }
1550     }
1551     if (subset.size() == 0)
1552     {
1553       return null;
1554     }
1555     AlignmentAnnotation[] anns = new AlignmentAnnotation[subset.size()];
1556     int i = 0;
1557     e = subset.elements();
1558     while (e.hasMoreElements())
1559     {
1560       anns[i++] = e.nextElement();
1561     }
1562     subset.removeAllElements();
1563     return anns;
1564   }
1565
1566   @Override
1567   public boolean updatePDBIds()
1568   {
1569     if (datasetSequence != null)
1570     {
1571       // TODO: could merge DBRefs
1572       return datasetSequence.updatePDBIds();
1573     }
1574     if (dbrefs == null || dbrefs.length == 0)
1575     {
1576       return false;
1577     }
1578     boolean added = false;
1579     for (DBRefEntry dbr : dbrefs)
1580     {
1581       if (DBRefSource.PDB.equals(dbr.getSource()))
1582       {
1583         /*
1584          * 'Add' any PDB dbrefs as a PDBEntry - add is only performed if the
1585          * PDB id is not already present in a 'matching' PDBEntry
1586          * Constructor parses out a chain code if appended to the accession id
1587          * (a fudge used to 'store' the chain code in the DBRef)
1588          */
1589         PDBEntry pdbe = new PDBEntry(dbr);
1590         added |= addPDBId(pdbe);
1591       }
1592     }
1593     return added;
1594   }
1595
1596   @Override
1597   public void transferAnnotation(SequenceI entry, Mapping mp)
1598   {
1599     if (datasetSequence != null)
1600     {
1601       datasetSequence.transferAnnotation(entry, mp);
1602       return;
1603     }
1604     if (entry.getDatasetSequence() != null)
1605     {
1606       transferAnnotation(entry.getDatasetSequence(), mp);
1607       return;
1608     }
1609     // transfer any new features from entry onto sequence
1610     if (entry.getSequenceFeatures() != null)
1611     {
1612
1613       List<SequenceFeature> sfs = entry.getSequenceFeatures();
1614       for (SequenceFeature feature : sfs)
1615       {
1616         SequenceFeature sf[] = (mp != null) ? mp.locateFeature(feature)
1617                 : new SequenceFeature[] { new SequenceFeature(feature) };
1618         if (sf != null)
1619         {
1620           for (int sfi = 0; sfi < sf.length; sfi++)
1621           {
1622             addSequenceFeature(sf[sfi]);
1623           }
1624         }
1625       }
1626     }
1627
1628     // transfer PDB entries
1629     if (entry.getAllPDBEntries() != null)
1630     {
1631       Enumeration<PDBEntry> e = entry.getAllPDBEntries().elements();
1632       while (e.hasMoreElements())
1633       {
1634         PDBEntry pdb = e.nextElement();
1635         addPDBId(pdb);
1636       }
1637     }
1638     // transfer database references
1639     DBRefEntry[] entryRefs = entry.getDBRefs();
1640     if (entryRefs != null)
1641     {
1642       for (int r = 0; r < entryRefs.length; r++)
1643       {
1644         DBRefEntry newref = new DBRefEntry(entryRefs[r]);
1645         if (newref.getMap() != null && mp != null)
1646         {
1647           // remap ref using our local mapping
1648         }
1649         // we also assume all version string setting is done by dbSourceProxy
1650         /*
1651          * if (!newref.getSource().equalsIgnoreCase(dbSource)) {
1652          * newref.setSource(dbSource); }
1653          */
1654         addDBRef(newref);
1655       }
1656     }
1657   }
1658
1659   /**
1660    * @return The index (zero-based) on this sequence in the MSA. It returns
1661    *         {@code -1} if this information is not available.
1662    */
1663   @Override
1664   public int getIndex()
1665   {
1666     return index;
1667   }
1668
1669   /**
1670    * Defines the position of this sequence in the MSA. Use the value {@code -1}
1671    * if this information is undefined.
1672    *
1673    * @param The
1674    *          position for this sequence. This value is zero-based (zero for
1675    *          this first sequence)
1676    */
1677   @Override
1678   public void setIndex(int value)
1679   {
1680     index = value;
1681   }
1682
1683   @Override
1684   public void setRNA(RNA r)
1685   {
1686     rna = r;
1687   }
1688
1689   @Override
1690   public RNA getRNA()
1691   {
1692     return rna;
1693   }
1694
1695   @Override
1696   public List<AlignmentAnnotation> getAlignmentAnnotations(String calcId,
1697           String label)
1698   {
1699     List<AlignmentAnnotation> result = new ArrayList<AlignmentAnnotation>();
1700     if (this.annotation != null)
1701     {
1702       for (AlignmentAnnotation ann : annotation)
1703       {
1704         if (ann.calcId != null && ann.calcId.equals(calcId)
1705                 && ann.label != null && ann.label.equals(label))
1706         {
1707           result.add(ann);
1708         }
1709       }
1710     }
1711     return result;
1712   }
1713
1714   @Override
1715   public String toString()
1716   {
1717     return getDisplayId(false);
1718   }
1719
1720   @Override
1721   public PDBEntry getPDBEntry(String pdbIdStr)
1722   {
1723     if (getDatasetSequence() != null)
1724     {
1725       return getDatasetSequence().getPDBEntry(pdbIdStr);
1726     }
1727     if (pdbIds == null)
1728     {
1729       return null;
1730     }
1731     List<PDBEntry> entries = getAllPDBEntries();
1732     for (PDBEntry entry : entries)
1733     {
1734       if (entry.getId().equalsIgnoreCase(pdbIdStr))
1735       {
1736         return entry;
1737       }
1738     }
1739     return null;
1740   }
1741
1742   @Override
1743   public List<DBRefEntry> getPrimaryDBRefs()
1744   {
1745     if (datasetSequence != null)
1746     {
1747       return datasetSequence.getPrimaryDBRefs();
1748     }
1749     if (dbrefs == null || dbrefs.length == 0)
1750     {
1751       return Collections.emptyList();
1752     }
1753     synchronized (dbrefs)
1754     {
1755       List<DBRefEntry> primaries = new ArrayList<DBRefEntry>();
1756       DBRefEntry[] tmp = new DBRefEntry[1];
1757       for (DBRefEntry ref : dbrefs)
1758       {
1759         if (!ref.isPrimaryCandidate())
1760         {
1761           continue;
1762         }
1763         if (ref.hasMap())
1764         {
1765           MapList mp = ref.getMap().getMap();
1766           if (mp.getFromLowest() > start || mp.getFromHighest() < end)
1767           {
1768             // map only involves a subsequence, so cannot be primary
1769             continue;
1770           }
1771         }
1772         // whilst it looks like it is a primary ref, we also sanity check type
1773         if (DBRefUtils.getCanonicalName(DBRefSource.PDB).equals(
1774                 DBRefUtils.getCanonicalName(ref.getSource())))
1775         {
1776           // PDB dbrefs imply there should be a PDBEntry associated
1777           // TODO: tighten PDB dbrefs
1778           // formally imply Jalview has actually downloaded and
1779           // parsed the pdb file. That means there should be a cached file
1780           // handle on the PDBEntry, and a real mapping between sequence and
1781           // extracted sequence from PDB file
1782           PDBEntry pdbentry = getPDBEntry(ref.getAccessionId());
1783           if (pdbentry != null && pdbentry.getFile() != null)
1784           {
1785             primaries.add(ref);
1786           }
1787           continue;
1788         }
1789         // check standard protein or dna sources
1790         tmp[0] = ref;
1791         DBRefEntry[] res = DBRefUtils.selectDbRefs(!isProtein(), tmp);
1792         if (res != null && res[0] == tmp[0])
1793         {
1794           primaries.add(ref);
1795           continue;
1796         }
1797       }
1798       return primaries;
1799     }
1800   }
1801
1802   /**
1803    * {@inheritDoc}
1804    */
1805   @Override
1806   public List<SequenceFeature> findFeatures(int fromColumn, int toColumn,
1807           String... types)
1808   {
1809     int startPos = findPosition(fromColumn - 1); // convert base 1 to base 0
1810     int endPos = findPosition(toColumn - 1);
1811
1812     List<SequenceFeature> result = new ArrayList<>();
1813     if (datasetSequence != null)
1814     {
1815       result = datasetSequence.getFeatures().findFeatures(startPos, endPos,
1816               types);
1817     }
1818     else
1819     {
1820       result = sequenceFeatureStore.findFeatures(startPos, endPos, types);
1821     }
1822
1823     /*
1824      * if the start or end column is gapped, startPos or endPos may be to the
1825      * left or right, and we may have included adjacent or enclosing features;
1826      * remove any that are not enclosing, non-contact features
1827      */
1828     if (endPos > this.end || Comparison.isGap(sequence[fromColumn - 1])
1829             || Comparison.isGap(sequence[toColumn - 1]))
1830     {
1831       ListIterator<SequenceFeature> it = result.listIterator();
1832       while (it.hasNext())
1833       {
1834         SequenceFeature sf = it.next();
1835         int featureStartColumn = findIndex(sf.getBegin());
1836         int featureEndColumn = findIndex(sf.getEnd());
1837         boolean noOverlap = featureStartColumn > toColumn
1838                         || featureEndColumn < fromColumn;
1839
1840         /*
1841          * reject an 'enclosing' feature if it is actually a contact feature
1842          */
1843         if (sf.isContactFeature() && featureStartColumn < fromColumn
1844                 && featureEndColumn > toColumn)
1845         {
1846           noOverlap = true;
1847         }
1848         if (noOverlap)
1849         {
1850           it.remove();
1851         }
1852       }
1853     }
1854
1855     return result;
1856   }
1857
1858   /**
1859    * Invalidates any stale cursors (forcing recalculation) by incrementing the
1860    * token that has to match the one presented by the cursor
1861    */
1862   @Override
1863   public void sequenceChanged()
1864   {
1865     changeCount++;
1866   }
1867
1868   /**
1869    * {@inheritDoc}
1870    */
1871   @Override
1872   public int replace(char c1, char c2)
1873   {
1874     if (c1 == c2)
1875     {
1876       return 0;
1877     }
1878     int count = 0;
1879     synchronized (sequence)
1880     {
1881       for (int c = 0; c < sequence.length; c++)
1882       {
1883         if (sequence[c] == c1)
1884         {
1885           sequence[c] = c2;
1886           count++;
1887         }
1888       }
1889     }
1890     if (count > 0)
1891     {
1892       sequenceChanged();
1893     }
1894
1895     return count;
1896   }
1897 }