sync for cvs weirdness

author jprocter <Jim Procter>

Fri, 26 Mar 2010 14:31:59 +0000 (14:31 +0000)

committer jprocter <Jim Procter>

Fri, 26 Mar 2010 14:31:59 +0000 (14:31 +0000)
author jprocter <Jim Procter>
Fri, 26 Mar 2010 14:31:59 +0000 (14:31 +0000)
committer jprocter <Jim Procter>
Fri, 26 Mar 2010 14:31:59 +0000 (14:31 +0000)
diff --git a/src/jalview/util/GroupUrlLink.java b/src/jalview/util/GroupUrlLink.java

index f319eb1..55e3bd9 100644 (file)
--- a/src/jalview/util/GroupUrlLink.java
+++ b/src/jalview/util/GroupUrlLink.java
@@ -1,729 +1,814 @@
-/*
- * Jalview - A Sequence Alignment Editor and Viewer (Development Version 2.4.1)
- * Copyright (C) 2009 AM Waterhouse, J Procter, G Barton, M Clamp, S Searle
- * 
- * This program is free software; you can redistribute it and/or
- * modify it under the terms of the GNU General Public License
- * as published by the Free Software Foundation; either version 2
- * of the License, or (at your option) any later version.
- * 
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
- * GNU General Public License for more details.
- * 
- * You should have received a copy of the GNU General Public License
- * along with this program; if not, write to the Free Software
- * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA
- */
-package jalview.util;
-
-import jalview.datamodel.Sequence;
-import jalview.datamodel.SequenceI;
-
-import java.util.Hashtable;
-import java.util.Vector;
-
-public class GroupUrlLink
-{
-  /**
-   * Helper class based on the UrlLink class which enables URLs to be
-   * constructed from sequences or IDs associated with a group of sequences. URL
-   * definitions consist of a pipe separated string containing a <label>|<url
-   * construct>|<separator character>[|<sequence separator character>]. The url
-   * construct includes regex qualified tokens which are replaced with seuqence
-   * IDs ($SEQUENCE_IDS$) and/or seuqence regions ($SEQUENCES$) that are
-   * extracted from the group. See <code>UrlLink</code> for more information
-   * about the approach, and the original implementation.
-   * 
-   */
-  private String url_prefix, target, label;
-
-  /**
-   * these are all filled in order of the occurence of each token in the url
-   * string template
-   */
-  private String url_suffix[], separators[], regexReplace[];
-
-  private String invalidMessage = null;
-
-  /**
-   * tokens that can be replaced in the URL.
-   */
-  private static String[] tokens;
-
-  /**
-   * position of each token (which can appear once only) in the url
-   */
-  private int[] segs;
-
-  /**
-   * contains tokens in the order they appear in the URL template.
-   */
-  private String[] mtch;
-  static
-  {
-    if (tokens == null)
-    {
-      tokens = new String[]
-      { "SEQUENCEIDS", "SEQUENCES", "DATASETID" };
-    }
-  }
-
-  // private int idseg = -1, seqseg = -1;
-
-  /**
-   * parse the given linkString of the form '<label>|<url>|separator
-   * char[|optional sequence separator char]' into parts. url may contain a
-   * string $SEQUENCEIDS<=optional regex=>$ where <=optional regex=> must be of
-   * the form =/<perl style regex>/=$ or $SEQUENCES<=optional regex=>$ or
-   * $SEQUENCES<=optional regex=>$.
-   * 
-   * @param link
-   */
-  public GroupUrlLink(String link)
-  {
-    int sep = link.indexOf("|");
-    segs = new int[tokens.length];
-    int ntoks = 0;
-    for (int i = 0; i < segs.length; i++)
-    {
-      if ((segs[i] = link.indexOf("$" + tokens[i])) > -1)
-      {
-        ntoks++;
-      }
-    }
-    // expect at least one token
-    if (ntoks == 0)
-    {
-      invalidMessage = "Group URL string must contain at least one of ";
-      for (int i = 0; i < segs.length; i++)
-      {
-        invalidMessage += " '$" + tokens[i] + "[=/regex=/]$'";
-      }
-      return;
-    }
-
-    int[] ptok = new int[ntoks + 1];
-    String[] tmtch = new String[ntoks + 1];
-    mtch = new String[ntoks];
-    for (int i = 0, t = 0; i < segs.length; i++)
-    {
-      if (segs[i] > -1)
-      {
-        ptok[t] = segs[i];
-        tmtch[t++] = tokens[i];
-      }
-    }
-    ptok[ntoks] = link.length();
-    tmtch[ntoks] = "$$$$$$$$$";
-    jalview.util.QuickSort.sort(ptok, tmtch);
-    for (int i = 0; i < ntoks; i++)
-    {
-      mtch[i] = tmtch[i]; // TODO: check order is ascending
-    }
-    /*
-     * replaces the specific code below {}; if (psqids > -1 && pseqs > -1) { if
-     * (psqids > pseqs) { idseg = 1; seqseg = 0;
-     * 
-     * ptok = new int[] { pseqs, psqids, link.length() }; mtch = new String[] {
-     * "$SEQUENCES", "$SEQUENCEIDS" }; } else { idseg = 0; seqseg = 1; ptok =
-     * new int[] { psqids, pseqs, link.length() }; mtch = new String[] {
-     * "$SEQUENCEIDS", "$SEQUENCES" }; } } else { if (psqids != -1) { idseg = 0;
-     * ptok = new int[] { psqids, link.length() }; mtch = new String[] {
-     * "$SEQUENCEIDS" }; } else { seqseg = 0; ptok = new int[] { pseqs,
-     * link.length() }; mtch = new String[] { "$SEQUENCES" }; } }
-     */
-
-    int p = sep;
-    // first get the label and target part before the first |
-    do
-    {
-      sep = p;
-      p = link.indexOf("|", sep + 1);
-    } while (p > sep && p < ptok[0]);
-    // Assuming that the URL itself does not contain any '|' symbols
-    // sep now contains last pipe symbol position prior to any regex symbols
-    label = link.substring(0, sep);
-    if (label.indexOf("|") > -1)
-    {
-      // | terminated database name / www target at start of Label
-      target = label.substring(0, label.indexOf("|"));
-    }
-    else if (label.indexOf(" ") > 2)
-    {
-      // space separated Label - matches database name
-      target = label.substring(0, label.indexOf(" "));
-    }
-    else
-    {
-      target = label;
-    }
-    // Now Parse URL : Whole URL string first
-    url_prefix = link.substring(sep + 1, ptok[0]);
-    url_suffix = new String[mtch.length];
-    regexReplace = new String[mtch.length];
-    // and loop through tokens
-    for (int pass = 0; pass < mtch.length; pass++)
-    {
-      int mlength = 3 + mtch[pass].length();
-      if (link.indexOf("$" + mtch[pass] + "=/") == ptok[pass]
-              && (p = link.indexOf("/=$", ptok[pass] + mlength)) > ptok[pass]
-                      + mlength)
-      {
-        // Extract Regex and suffix
-        if (ptok[pass + 1] < p + 3)
-        {
-          // tokens are not allowed inside other tokens - e.g. inserting a
-          // $sequences$ into the regex match for the sequenceid
-          invalidMessage = "Token regexes cannot contain other regexes (did you terminate the $"
-                  + mtch[pass] + " regex with a '/=$' ?";
-          return;
-        }
-        url_suffix[pass] = link.substring(p + 3, ptok[pass + 1]);
-        regexReplace[pass] = link.substring(ptok[pass] + mlength, p);
-        try
-        {
-          com.stevesoft.pat.Regex rg = com.stevesoft.pat.Regex.perlCode("/"
-                  + regexReplace[pass] + "/");
-          if (rg == null)
-          {
-            invalidMessage = "Invalid Regular Expression : '"
-                    + regexReplace[pass] + "'\n";
-          }
-        } catch (Exception e)
-        {
-          invalidMessage = "Invalid Regular Expression : '"
-                  + regexReplace[pass] + "'\n";
-        }
-      }
-      else
-      {
-        regexReplace[pass] = null;
-        // verify format is really correct.
-        if ((p = link.indexOf("$" + mtch[pass] + "$")) == ptok[pass])
-        {
-          url_suffix[pass] = link.substring(p + mtch[pass].length() + 2,
-                  ptok[pass + 1]);
-        }
-        else
-        {
-          invalidMessage = "Warning: invalid regex structure (after '"
-                  + mtch[0] + "') for URL link : " + link;
-        }
-      }
-    }
-    int pass = 0;
-    separators = new String[url_suffix.length];
-    String suffices = url_suffix[url_suffix.length - 1], lastsep = ",";
-    // have a look in the last suffix for any more separators.
-    while ((p = suffices.indexOf('|')) > -1)
-    {
-      separators[pass] = suffices.substring(p + 1);
-      if (pass == 0)
-      {
-        // trim the original suffix string
-        url_suffix[url_suffix.length - 1] = suffices.substring(0, p);
-      }
-      else
-      {
-        lastsep = (separators[pass - 1] = separators[pass - 1].substring(0,
-                p));
-      }
-      suffices = separators[pass];
-      pass++;
-    }
-    if (pass > 0)
-    {
-      lastsep = separators[pass - 1];
-    }
-    // last separator is always used for all the remaining separators
-    while (pass < separators.length)
-    {
-      separators[pass++] = lastsep;
-    }
-  }
-
-  /**
-   * @return the url_suffix
-   */
-  public String getUrl_suffix()
-  {
-    return url_suffix[url_suffix.length - 1];
-  }
-
-  /**
-   * @return the url_prefix
-   */
-  public String getUrl_prefix()
-  {
-    return url_prefix;
-  }
-
-  /**
-   * @return the target
-   */
-  public String getTarget()
-  {
-    return target;
-  }
-
-  /**
-   * @return the label
-   */
-  public String getLabel()
-  {
-    return label;
-  }
-
-  /**
-   * @return the sequence ID regexReplace
-   */
-  public String getIDRegexReplace()
-  {
-    return _replaceFor(tokens[0]);
-  }
-
-  private String _replaceFor(String token)
-  {
-    for (int i = 0; i < mtch.length; i++)
-      if (segs[i] > -1 && mtch[i].equals(token))
-      {
-        return regexReplace[i];
-      }
-    return null;
-  }
-
-  /**
-   * @return the sequence ID regexReplace
-   */
-  public String getSeqRegexReplace()
-  {
-    return _replaceFor(tokens[1]);
-  }
-
-  /**
-   * @return the invalidMessage
-   */
-  public String getInvalidMessage()
-  {
-    return invalidMessage;
-  }
-
-  /**
-   * Check if URL string was parsed properly.
-   * 
-   * @return boolean - if false then <code>getInvalidMessage</code> returns an
-   *         error message
-   */
-  public boolean isValid()
-  {
-    return invalidMessage == null;
-  }
-
-  /**
-   * return one or more URL strings by applying regex to the given idstring
-   * 
-   * @param idstrings
-   *          array of id strings to pass to service
-   * @param seqstrings
-   *          array of seq strings to pass to service
-   * @param onlyIfMatches
-   *          - when true url strings are only made if regex is defined and
-   *          matches for all qualified tokens in groupURL - TODO: consider if
-   *          onlyIfMatches is really a useful parameter!
-   * @return null or Object[] { int[] { number of seqs substituted},boolean[] {
-   *         which seqs were substituted }, StringBuffer[] { substituted lists
-   *         for each token }, String[] { url } }
-   */
-  public Object[] makeUrls(String[] idstrings, String[] seqstrings,
-          String dsstring, boolean onlyIfMatches)
-  {
-    Hashtable rstrings = new Hashtable();
-    rstrings.put(tokens[0], idstrings);
-    rstrings.put(tokens[1], seqstrings);
-    rstrings.put(tokens[2], new String[]
-    { dsstring });
-    if (idstrings.length != seqstrings.length)
-    {
-      throw new Error(
-              "idstrings and seqstrings contain one string each per sequence.");
-    }
-    return makeUrls(rstrings, onlyIfMatches);
-  }
-
-  public Object[] makeUrls(Hashtable repstrings, boolean onlyIfMatches)
-  {
-    // prepare string arrays in correct order to be assembled into URL input
-    String[][] idseq = new String[mtch.length][]; // indexed by pass
-    int mins = 0, maxs = 0; // allowed two values, 1 or n-sequences.
-    for (int i = 0; i < mtch.length; i++)
-    {
-      idseq[i] = (String[]) repstrings.get(mtch[i]);
-      if (idseq[i].length >= 1)
-      {
-        if (mins == 0 && idseq[i].length == 1)
-        {
-          mins = 1;
-        }
-        if (maxs < 2)
-        {
-          maxs = idseq[i].length;
-        }
-        else
-        {
-          if (maxs != idseq[i].length)
-          {
-            throw new Error(
-                    "Cannot have mixed length replacement vectors. Replacement vector for "
-                            + (mtch[i]) + " is " + idseq[i].length
-                            + " strings long, and have already seen a "
-                            + maxs + " length vector.");
-          }
-        }
-      }
-      else
-      {
-        throw new Error(
-                "Cannot have zero length vector of replacement strings - either 1 value or n values.");
-      }
-    }
-    int pass = 0;
-    // iterate through input, collating segments to be inserted into url
-    StringBuffer matched[] = new StringBuffer[idseq.length];
-    // and precompile regexes
-    com.stevesoft.pat.Regex[] rgxs = new com.stevesoft.pat.Regex[matched.length];
-    for (pass = 0; pass < matched.length; pass++)
-    {
-      matched[pass] = new StringBuffer();
-      if (regexReplace[pass] != null)
-      {
-        rgxs[pass] = com.stevesoft.pat.Regex.perlCode("/" + regexReplace[pass]
-                + "/");
-      }
-      else
-      {
-        rgxs[pass] = null;
-      }
-    }
-    // record which of the input sequences were actually used to generate the
-    // url
-    boolean[] thismatched = new boolean[maxs];
-    int seqsmatched = 0;
-    for (int sq = 0; sq < maxs; sq++)
-    {
-      // initialise flag for match
-      thismatched[sq] = false;
-      String[] thematches = new String[rgxs.length];
-      for (pass = 0; pass < rgxs.length; pass++)
-      {
-        thematches[pass] = ""; // initialise - in case there are no more
-        // matches.
-        // if a regex is provided, then it must match for all sequences in all
-        // tokens for it to be considered.
-        if (idseq[pass].length <= sq)
-        {
-          // no more replacement strings to try for this token
-          continue;
-        }
-        if (rgxs[pass] != null)
-        {
-          com.stevesoft.pat.Regex rg = rgxs[pass];
-          int rematchat = 0;
-          // concatenate all matches of re in the given string!
-          while (rg.searchFrom(idseq[pass][sq], rematchat))
-          {
-            rematchat = rg.matchedTo();
-            thismatched[sq] |= true;
-            // do we take the cartesian products of the substituents ?
-            int ns = rg.numSubs();
-            if (ns == 0)
-            {
-              thematches[pass] += rg.stringMatched();// take whole regex
-            }
-            /*
-             * else if (ns==1) { // take only subgroup match return new String[]
-             * { rg.stringMatched(1), url_prefix+rg.stringMatched(1)+url_suffix
-             * }; }
-             */
-            // deal with multiple submatch case - for moment we do the simplest
-            // - concatenate the matched regions, instead of creating a complete
-            // list for each alternate match over all sequences.
-            // TODO: specify a 'replace pattern' - next refinement
-            else
-            {
-              // debug
-              for (int s = 0; s <= rg.numSubs(); s++)
-              {
-                System.err.println("Sub " + s + " : " + rg.matchedFrom(s)
-                        + " : " + rg.matchedTo(s) + " : '"
-                        + rg.stringMatched(s) + "'");
-              }
-              // try to collate subgroup matches
-              StringBuffer subs = new StringBuffer();
-              // have to loop through submatches, collating them at top level
-              // match
-              int s = 0; // 1;
-              while (s <= ns)
-              {
-                if (s + 1 <= ns && rg.matchedTo(s) > -1
-                        && rg.matchedTo(s + 1) > -1
-                        && rg.matchedTo(s + 1) < rg.matchedTo(s))
-                {
-                  // s is top level submatch. search for submatches enclosed by
-                  // this one
-                  int r = s + 1;
-                  String rmtch = "";
-                  while (r <= ns && rg.matchedTo(r) <= rg.matchedTo(s))
-                  {
-                    if (rg.matchedFrom(r) > -1)
-                    {
-                      rmtch += rg.stringMatched(r);
-                    }
-                    r++;
-                  }
-                  if (rmtch.length() > 0)
-                  {
-                    subs.append(rmtch); // simply concatenate
-                  }
-                  s = r;
-                }
-                else
-                {
-                  if (rg.matchedFrom(s) > -1)
-                  {
-                    subs.append(rg.stringMatched(s)); // concatenate
-                  }
-                  s++;
-                }
-              }
-              thematches[pass] += subs.toString();
-            }
-          }
-        }
-        else
-        {
-          // are we only supposed to take regex matches ?
-          if (!onlyIfMatches)
-          {
-            thismatched[sq] |= true;
-            thematches[pass] = idseq[pass][sq]; // take whole string -
-            // regardless - probably not a
-            // good idea!
-            /*
-             * TODO: do some boilerplate trimming of the fields to make them
-             * sensible e.g. trim off any 'prefix' in the id string (see UrlLink
-             * for the below) - pre 2.4 Jalview behaviour if
-             * (idstring.indexOf("|") > -1) { idstring =
-             * idstring.substring(idstring.lastIndexOf("|") + 1); }
-             */
-
-          }
-        }
-      }
-
-      // check if we are going to add this sequence's results ? all token
-      // replacements must be valid for this to happen!
-      // (including single value replacements - eg. dataset name)
-      if (thismatched[sq])
-      {
-        for (pass = 0; pass < matched.length; pass++)
-        {
-          if (idseq[pass].length > 1 && matched[pass].length() > 0)
-          {
-            matched[pass].append(separators[pass]);
-          }
-          matched[pass].append(thematches[pass]);
-        }
-        seqsmatched++;
-      }
-    }
-    // finally, if any sequences matched, then form the URL and return
-    if (matched[0].length() == 0)
-    {
-      // no matches - no url generated
-      return null;
-    }
-    StringBuffer submiturl = new StringBuffer();
-    submiturl.append(url_prefix);
-    for (pass = 0; pass < matched.length; pass++)
-    {
-      submiturl.append(matched[pass]);
-      if (url_suffix[pass] != null)
-      {
-        submiturl.append(url_suffix[pass]);
-      }
-    }
-
-    return new Object[]
-    { new int[]
-    { seqsmatched }, thismatched, matched, new String[]
-    { submiturl.toString() } };
-  }
-
-  /**
-   * get token types present in this url as a bitfield indicating presence of each token from tokens (LSB->MSB).
-   * @return groupURL class as integer
-   */
-  public int getGroupURLType()
-  {
-    int r = 0;
-    for (int pass = 0; pass < tokens.length; pass++)
-    {
-      for (int i = 0; i < mtch.length; i++)
-      {
-        if (mtch[i].equals(tokens[pass]))
-        {
-          r += 1 << pass;
-        }
-      }
-    }
-    return r;
-  }
-
-  public String toString()
-  {
-    StringBuffer result = new StringBuffer();
-    result.append(label + "|" + url_prefix);
-    int r;
-    for (r = 0; r < url_suffix.length; r++)
-    {
-      result.append("$");
-      result.append(mtch[r]);
-      if (regexReplace[r] != null)
-      {
-        result.append("=/");
-        result.append(regexReplace[r]);
-        result.append("/=");
-      }
-      result.append("$");
-      result.append(url_suffix[r]);
-    }
-    for (r = 0; r < separators.length; r++)
-    {
-      result.append("|");
-      result.append(separators[r]);
-    }
-    return result.toString();
-  }
-
-  /**
-   * report stats about the generated url string given an input set
-   * 
-   * @param ul
-   * @param idstring
-   * @param url
-   */
-  private static void testUrls(GroupUrlLink ul, String[][] idstring,
-          Object[] url)
-  {
-
-    if (url == null)
-    {
-      System.out.println("Created NO urls.");
-    }
-    else
-    {
-      System.out.println("Created a url from " + ((int[]) url[0])[0]
-              + "out of " + idstring[0].length + " sequences.");
-      System.out.println("Sequences that did not match:");
-      for (int sq = 0; sq < idstring[0].length; sq++)
-      {
-        if (!((boolean[]) url[1])[sq])
-        {
-          System.out.println("Seq " + sq + ": " + idstring[0][sq] + "\t: "
-                  + idstring[1][sq]);
-        }
-      }
-      System.out.println("Sequences that DID match:");
-      for (int sq = 0; sq < idstring[0].length; sq++)
-      {
-        if (((boolean[]) url[1])[sq])
-        {
-          System.out.println("Seq " + sq + ": " + idstring[0][sq] + "\t: "
-                  + idstring[1][sq]);
-        }
-      }
-      System.out.println("The generated URL:");
-      System.out.println(((String[]) url[3])[0]);
-    }
-  }
-
-  public static void main(String argv[])
-  {
-    String[] links = new String[]
-    {
-        "EnVision2|IDS|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=Enfin%20Default%20Workflow&datasetName=linkInDatasetFromJalview&input=$SEQUENCEIDS$&inputType=0|,",
-        "EnVision2|Seqs|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=Enfin%20Default%20Workflow&datasetName=linkInDatasetFromJalview&input=$SEQUENCES$&inputType=1|,",
-        "EnVision2|IDS|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=Enfin%20Default%20Workflow&datasetName=$DATASETID$&input=$SEQUENCEIDS$&inputType=0|,",
-        "EnVision2|Seqs|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=Enfin%20Default%20Workflow&datasetName=$DATASETID$&input=$SEQUENCES$&inputType=1|,",
-        "EnVision2|IDS|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=$SEQUENCEIDS$&datasetName=linkInDatasetFromJalview&input=$SEQUENCEIDS$&inputType=0|,",
-        "EnVision2|Seqs|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=$SEQUENCEIDS$&datasetName=$DATASETID$&input=$SEQUENCES$&inputType=1|,",
-        "EnVision2 Seqs|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=Default&datasetName=JalviewSeqs$DATASETID$&input=$SEQUENCES=/([a-zA-Z]+)/=$&inputType=1|,",
-        "EnVision2 Seqs|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=Default&datasetName=JalviewSeqs$DATASETID$&input=$SEQUENCES=/[A-Za-z]+/=$&inputType=1|,"
-    /*
-     * http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?input=P38389,P38398
-     * &inputType=0&workflow=Enfin%20Default%20Workflow&datasetName=
-     * linkInDatasetFromPRIDE
-     */
-    };
-
-    SequenceI[] seqs = new SequenceI[]
-    { new Sequence("StupidLabel:gi|9234|pdb|102L|A",
-            "asdiasdpasdpadpwpadasdpaspdw"), };
-    String[][] seqsandids = formStrings(seqs);
-    for (int i = 0; i < links.length; i++)
-    {
-      GroupUrlLink ul = new GroupUrlLink(links[i]);
-      if (ul.isValid())
-      {
-        System.out.println("\n\n\n");
-        System.out.println("Link " + i + " " + links[i] + " : "
-                + ul.toString());
-        System.out.println(" pref : " + ul.getUrl_prefix());
-        System.out.println(" IdReplace : " + ul.getIDRegexReplace());
-        System.out.println(" SeqReplace : " + ul.getSeqRegexReplace());
-        System.out.println(" Suffixes : " + ul.getUrl_suffix());
-
-        System.out
-                .println("<insert input id and sequence strings here> Without onlyIfMatches:");
-        Object[] urls = ul.makeUrls(seqsandids[0], seqsandids[1],
-                "mydataset", false);
-        testUrls(ul, seqsandids, urls);
-        System.out
-                .println("<insert input id and sequence strings here> With onlyIfMatches set:");
-        urls = ul.makeUrls(seqsandids[0], seqsandids[1], "mydataset", true);
-        testUrls(ul, seqsandids, urls);
-      }
-      else
-      {
-        System.err.println("Invalid URLLink : " + links[i] + " : "
-                + ul.getInvalidMessage());
-      }
-    }
-  }
-
-  /**
-   * covenience method to generate the id and sequence string vector from a set
-   * of seuqences using each sequence's getName() and getSequenceAsString()
-   * method
-   * 
-   * @param seqs
-   * @return String[][] {{sequence ids},{sequence strings}}
-   */
-  public static String[][] formStrings(SequenceI[] seqs)
-  {
-    String[][] idset = new String[2][seqs.length];
-    for (int i = 0; i < seqs.length; i++)
-    {
-      idset[0][i] = seqs[i].getName();
-      idset[1][i] = seqs[i].getSequenceAsString();
-    }
-    return idset;
-  }
-
-  public void setLabel(String newlabel)
-  {
-    this.label = newlabel;
-  }
-}
+/*\r
+ * Jalview - A Sequence Alignment Editor and Viewer (Development Version 2.4.1)\r
+ * Copyright (C) 2009 AM Waterhouse, J Procter, G Barton, M Clamp, S Searle\r
+ * \r
+ * This program is free software; you can redistribute it and/or\r
+ * modify it under the terms of the GNU General Public License\r
+ * as published by the Free Software Foundation; either version 2\r
+ * of the License, or (at your option) any later version.\r
+ * \r
+ * This program is distributed in the hope that it will be useful,\r
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of\r
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the\r
+ * GNU General Public License for more details.\r
+ * \r
+ * You should have received a copy of the GNU General Public License\r
+ * along with this program; if not, write to the Free Software\r
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA\r
+ */\r
+package jalview.util;\r
+\r
+import jalview.datamodel.Sequence;\r
+import jalview.datamodel.SequenceI;\r
+\r
+import java.util.Hashtable;\r
+import java.util.Vector;\r
+\r
+public class GroupUrlLink\r
+{\r
+  /**\r
+   * Helper class based on the UrlLink class which enables URLs to be\r
+   * constructed from sequences or IDs associated with a group of sequences. URL\r
+   * definitions consist of a pipe separated string containing a <label>|<url\r
+   * construct>|<separator character>[|<sequence separator character>]. The url\r
+   * construct includes regex qualified tokens which are replaced with sequence\r
+   * IDs ($SEQUENCEIDS$) and/or sequence regions ($SEQUENCES$) that are\r
+   * extracted from the group. See <code>UrlLink</code> for more information\r
+   * about the approach, and the original implementation.\r
+   * Documentation to come. Note - groupUrls can be very big!\r
+   */\r
+  private String url_prefix, target, label;\r
+\r
+  /**\r
+   * these are all filled in order of the occurrence of each token in the url\r
+   * string template\r
+   */\r
+  private String url_suffix[], separators[], regexReplace[];\r
+\r
+  private String invalidMessage = null;\r
+\r
+  /**\r
+   * tokens that can be replaced in the URL.\r
+   */\r
+  private static String[] tokens;\r
+\r
+  /**\r
+   * position of each token (which can appear once only) in the url\r
+   */\r
+  private int[] segs;\r
+\r
+  /**\r
+   * contains tokens in the order they appear in the URL template.\r
+   */\r
+  private String[] mtch;\r
+  static\r
+  {\r
+    if (tokens == null)\r
+    {\r
+      tokens = new String[]\r
+      { "SEQUENCEIDS", "SEQUENCES", "DATASETID" };\r
+    }\r
+  }\r
+\r
+  // private int idseg = -1, seqseg = -1;\r
+\r
+  /**\r
+   * parse the given linkString of the form '<label>|<url>|separator\r
+   * char[|optional sequence separator char]' into parts. url may contain a\r
+   * string $SEQUENCEIDS<=optional regex=>$ where <=optional regex=> must be of\r
+   * the form =/<perl style regex>/=$ or $SEQUENCES<=optional regex=>$ or\r
+   * $DATASETID<=optional regex=>$.\r
+   * \r
+   * @param link\r
+   */\r
+  public GroupUrlLink(String link)\r
+  {\r
+    int sep = link.indexOf("|");\r
+    segs = new int[tokens.length];\r
+    int ntoks = 0;\r
+    for (int i = 0; i < segs.length; i++)\r
+    {\r
+      if ((segs[i] = link.indexOf("$" + tokens[i])) > -1)\r
+      {\r
+        ntoks++;\r
+      }\r
+    }\r
+    // expect at least one token\r
+    if (ntoks == 0)\r
+    {\r
+      invalidMessage = "Group URL string must contain at least one of ";\r
+      for (int i = 0; i < segs.length; i++)\r
+      {\r
+        invalidMessage += " '$" + tokens[i] + "[=/regex=/]$'";\r
+      }\r
+      return;\r
+    }\r
+\r
+    int[] ptok = new int[ntoks + 1];\r
+    String[] tmtch = new String[ntoks + 1];\r
+    mtch = new String[ntoks];\r
+    for (int i = 0, t = 0; i < segs.length; i++)\r
+    {\r
+      if (segs[i] > -1)\r
+      {\r
+        ptok[t] = segs[i];\r
+        tmtch[t++] = tokens[i];\r
+      }\r
+    }\r
+    ptok[ntoks] = link.length();\r
+    tmtch[ntoks] = "$$$$$$$$$";\r
+    jalview.util.QuickSort.sort(ptok, tmtch);\r
+    for (int i = 0; i < ntoks; i++)\r
+    {\r
+      mtch[i] = tmtch[i]; // TODO: check order is ascending\r
+    }\r
+    /*\r
+     * replaces the specific code below {}; if (psqids > -1 && pseqs > -1) { if\r
+     * (psqids > pseqs) { idseg = 1; seqseg = 0;\r
+     * \r
+     * ptok = new int[] { pseqs, psqids, link.length() }; mtch = new String[] {\r
+     * "$SEQUENCES", "$SEQUENCEIDS" }; } else { idseg = 0; seqseg = 1; ptok =\r
+     * new int[] { psqids, pseqs, link.length() }; mtch = new String[] {\r
+     * "$SEQUENCEIDS", "$SEQUENCES" }; } } else { if (psqids != -1) { idseg = 0;\r
+     * ptok = new int[] { psqids, link.length() }; mtch = new String[] {\r
+     * "$SEQUENCEIDS" }; } else { seqseg = 0; ptok = new int[] { pseqs,\r
+     * link.length() }; mtch = new String[] { "$SEQUENCES" }; } }\r
+     */\r
+\r
+    int p = sep;\r
+    // first get the label and target part before the first |\r
+    do\r
+    {\r
+      sep = p;\r
+      p = link.indexOf("|", sep + 1);\r
+    } while (p > sep && p < ptok[0]);\r
+    // Assuming that the URL itself does not contain any '|' symbols\r
+    // sep now contains last pipe symbol position prior to any regex symbols\r
+    label = link.substring(0, sep);\r
+    if (label.indexOf("|") > -1)\r
+    {\r
+      // | terminated database name / www target at start of Label\r
+      target = label.substring(0, label.indexOf("|"));\r
+    }\r
+    else if (label.indexOf(" ") > 2)\r
+    {\r
+      // space separated Label - matches database name\r
+      target = label.substring(0, label.indexOf(" "));\r
+    }\r
+    else\r
+    {\r
+      target = label;\r
+    }\r
+    // Now Parse URL : Whole URL string first\r
+    url_prefix = link.substring(sep + 1, ptok[0]);\r
+    url_suffix = new String[mtch.length];\r
+    regexReplace = new String[mtch.length];\r
+    // and loop through tokens\r
+    for (int pass = 0; pass < mtch.length; pass++)\r
+    {\r
+      int mlength = 3 + mtch[pass].length();\r
+      if (link.indexOf("$" + mtch[pass] + "=/") == ptok[pass]\r
+              && (p = link.indexOf("/=$", ptok[pass] + mlength)) > ptok[pass]\r
+                      + mlength)\r
+      {\r
+        // Extract Regex and suffix\r
+        if (ptok[pass + 1] < p + 3)\r
+        {\r
+          // tokens are not allowed inside other tokens - e.g. inserting a\r
+          // $sequences$ into the regex match for the sequenceid\r
+          invalidMessage = "Token regexes cannot contain other regexes (did you terminate the $"\r
+                  + mtch[pass] + " regex with a '/=$' ?";\r
+          return;\r
+        }\r
+        url_suffix[pass] = link.substring(p + 3, ptok[pass + 1]);\r
+        regexReplace[pass] = link.substring(ptok[pass] + mlength, p);\r
+        try\r
+        {\r
+          com.stevesoft.pat.Regex rg = com.stevesoft.pat.Regex.perlCode("/"\r
+                  + regexReplace[pass] + "/");\r
+          if (rg == null)\r
+          {\r
+            invalidMessage = "Invalid Regular Expression : '"\r
+                    + regexReplace[pass] + "'\n";\r
+          }\r
+        } catch (Exception e)\r
+        {\r
+          invalidMessage = "Invalid Regular Expression : '"\r
+                  + regexReplace[pass] + "'\n";\r
+        }\r
+      }\r
+      else\r
+      {\r
+        regexReplace[pass] = null;\r
+        // verify format is really correct.\r
+        if ((p = link.indexOf("$" + mtch[pass] + "$")) == ptok[pass])\r
+        {\r
+          url_suffix[pass] = link.substring(p + mtch[pass].length() + 2,\r
+                  ptok[pass + 1]);\r
+        }\r
+        else\r
+        {\r
+          invalidMessage = "Warning: invalid regex structure (after '"\r
+                  + mtch[0] + "') for URL link : " + link;\r
+        }\r
+      }\r
+    }\r
+    int pass = 0;\r
+    separators = new String[url_suffix.length];\r
+    String suffices = url_suffix[url_suffix.length - 1], lastsep = ",";\r
+    // have a look in the last suffix for any more separators.\r
+    while ((p = suffices.indexOf('|')) > -1)\r
+    {\r
+      separators[pass] = suffices.substring(p + 1);\r
+      if (pass == 0)\r
+      {\r
+        // trim the original suffix string\r
+        url_suffix[url_suffix.length - 1] = suffices.substring(0, p);\r
+      }\r
+      else\r
+      {\r
+        lastsep = (separators[pass - 1] = separators[pass - 1].substring(0,\r
+                p));\r
+      }\r
+      suffices = separators[pass];\r
+      pass++;\r
+    }\r
+    if (pass > 0)\r
+    {\r
+      lastsep = separators[pass - 1];\r
+    }\r
+    // last separator is always used for all the remaining separators\r
+    while (pass < separators.length)\r
+    {\r
+      separators[pass++] = lastsep;\r
+    }\r
+  }\r
+\r
+  /**\r
+   * @return the url_suffix\r
+   */\r
+  public String getUrl_suffix()\r
+  {\r
+    return url_suffix[url_suffix.length - 1];\r
+  }\r
+\r
+  /**\r
+   * @return the url_prefix\r
+   */\r
+  public String getUrl_prefix()\r
+  {\r
+    return url_prefix;\r
+  }\r
+\r
+  /**\r
+   * @return the target\r
+   */\r
+  public String getTarget()\r
+  {\r
+    return target;\r
+  }\r
+\r
+  /**\r
+   * @return the label\r
+   */\r
+  public String getLabel()\r
+  {\r
+    return label;\r
+  }\r
+\r
+  /**\r
+   * @return the sequence ID regexReplace\r
+   */\r
+  public String getIDRegexReplace()\r
+  {\r
+    return _replaceFor(tokens[0]);\r
+  }\r
+\r
+  /**\r
+   * Look up the regex recorded for a token of this link.\r
+   * \r
+   * @param token\r
+   *          token name to search for in mtch\r
+   * @return the regexReplace entry at the first position whose segs value is\r
+   *         greater than -1 and whose mtch entry equals token (this entry may\r
+   *         itself be null), or null if there is no such position\r
+   */\r
+  private String _replaceFor(String token)\r
+  {\r
+    int idx = 0;\r
+    while (idx < mtch.length)\r
+    {\r
+      if (segs[idx] > -1 && mtch[idx].equals(token))\r
+      {\r
+        return regexReplace[idx];\r
+      }\r
+      idx++;\r
+    }\r
+    return null;\r
+  }\r
+\r
+  /**\r
+   * @return the sequence ID regexReplace\r
+   */\r
+  public String getSeqRegexReplace()\r
+  {\r
+    return _replaceFor(tokens[1]);\r
+  }\r
+\r
+  /**\r
+   * @return the invalidMessage\r
+   */\r
+  public String getInvalidMessage()\r
+  {\r
+    return invalidMessage;\r
+  }\r
+\r
+  /**\r
+   * Check if URL string was parsed properly.\r
+   * \r
+   * @return boolean - if false then <code>getInvalidMessage</code> returns an\r
+   *         error message\r
+   */\r
+  public boolean isValid()\r
+  {\r
+    return invalidMessage == null;\r
+  }\r
+\r
+  /**\r
+   * return one or more URL strings by applying regex to the given idstring\r
+   * \r
+   * @param idstrings\r
+   *          array of id strings to pass to service\r
+   * @param seqstrings\r
+   *          array of seq strings to pass to service\r
+   * @param onlyIfMatches\r
+   *          - when true url strings are only made if regex is defined and\r
+   *          matches for all qualified tokens in groupURL - TODO: consider if\r
+   *          onlyIfMatches is really a useful parameter!\r
+   * @return null or Object[] { int[] { number of seqs substituted},boolean[] {\r
+   *         which seqs were substituted }, StringBuffer[] { substituted lists\r
+   *         for each token }, String[] { url } }\r
+   */\r
+  public Object[] makeUrls(String[] idstrings, String[] seqstrings,\r
+          String dsstring, boolean onlyIfMatches)\r
+  {\r
+    Hashtable rstrings = replacementArgs(idstrings, seqstrings, dsstring);\r
+    return makeUrls(rstrings, onlyIfMatches);\r
+  }\r
+\r
+  /**\r
+   * gathers input into a hashtable\r
+   * @param idstrings\r
+   * @param seqstrings\r
+   * @param dsstring\r
+   * @return\r
+   */\r
+  private Hashtable replacementArgs(String[] idstrings,\r
+          String[] seqstrings, String dsstring)\r
+  {\r
+    Hashtable rstrings = new Hashtable();\r
+    rstrings.put(tokens[0], idstrings);\r
+    rstrings.put(tokens[1], seqstrings);\r
+    rstrings.put(tokens[2], new String[]\r
+    { dsstring });\r
+    if (idstrings.length != seqstrings.length)\r
+    {\r
+      throw new Error(\r
+              "idstrings and seqstrings contain one string each per sequence.");\r
+    }\r
+    return rstrings;\r
+  }\r
+\r
+  public Object[] makeUrls(Hashtable repstrings, boolean onlyIfMatches)\r
+  {\r
+    return makeUrlsIf(true,repstrings,onlyIfMatches);\r
+  }\r
+  /**\r
+   * \r
+   * @param ids\r
+   * @param seqstr\r
+   * @param string\r
+   * @param b\r
+   * @return URL stub objects ready to pass to constructFrom  \r
+   */\r
+  public Object[] makeUrlStubs(String[] ids, String[] seqstr,\r
+          String string, boolean b)\r
+  {\r
+    Hashtable rstrings = replacementArgs(ids, seqstr, string);\r
+    Object[] stubs = makeUrlsIf(false, rstrings, b);\r
+    if (stubs!=null)\r
+    {\r
+      return new Object[] { stubs[0], stubs[1], rstrings, new boolean[] { b } };\r
+    }\r
+    // TODO Auto-generated method stub\r
+    return null;\r
+  }\r
+\r
+  /**\r
+   * generate the URL for the given URL stub object array returned from makeUrlStubs\r
+   * @param stubs\r
+   * @return URL string.\r
+   */\r
+  public String constructFrom(Object[] stubs)\r
+  {\r
+    Object[] results = makeUrlsIf(true, (Hashtable) stubs[2], ((boolean[])stubs[3])[0]);    \r
+    return ((String[]) results[3])[0];\r
+  }\r
+  /**\r
+   * conditionally generate urls or stubs for a given input.\r
+   * @param createFullUrl set to false if you only want to test if URLs would be generated.\r
+   * @param repstrings\r
+   * @param onlyIfMatches\r
+   * @return null if no url is generated. Object[] { int[] { number of matches seqs }, boolean[] { which matched }, (if createFullUrl also has StringBuffer[] { segment generated from inputs that is used in URL }, String[] { url })}\r
+   */\r
+  protected Object[] makeUrlsIf(boolean createFullUrl, Hashtable repstrings, boolean onlyIfMatches)\r
+  {\r
+    // prepare string arrays in correct order to be assembled into URL input\r
+    String[][] idseq = new String[mtch.length][]; // indexed by pass\r
+    int mins = 0, maxs = 0; // allowed two values, 1 or n-sequences.\r
+    for (int i = 0; i < mtch.length; i++)\r
+    {\r
+      idseq[i] = (String[]) repstrings.get(mtch[i]);\r
+      if (idseq[i].length >= 1)\r
+      {\r
+        if (mins == 0 && idseq[i].length == 1)\r
+        {\r
+          mins = 1;\r
+        }\r
+        if (maxs < 2)\r
+        {\r
+          maxs = idseq[i].length;\r
+        }\r
+        else\r
+        {\r
+          if (maxs != idseq[i].length)\r
+          {\r
+            throw new Error(\r
+                    "Cannot have mixed length replacement vectors. Replacement vector for "\r
+                            + (mtch[i]) + " is " + idseq[i].length\r
+                            + " strings long, and have already seen a "\r
+                            + maxs + " length vector.");\r
+          }\r
+        }\r
+      }\r
+      else\r
+      {\r
+        throw new Error(\r
+                "Cannot have zero length vector of replacement strings - either 1 value or n values.");\r
+      }\r
+    }\r
+    int pass = 0;\r
+    // iterate through input, collating segments to be inserted into url\r
+    StringBuffer matched[] = new StringBuffer[idseq.length];\r
+    // and precompile regexes\r
+    com.stevesoft.pat.Regex[] rgxs = new com.stevesoft.pat.Regex[matched.length];\r
+    for (pass = 0; pass < matched.length; pass++)\r
+    {\r
+      matched[pass] = new StringBuffer();\r
+      if (regexReplace[pass] != null)\r
+      {\r
+        rgxs[pass] = com.stevesoft.pat.Regex.perlCode("/" + regexReplace[pass]\r
+                + "/");\r
+      }\r
+      else\r
+      {\r
+        rgxs[pass] = null;\r
+      }\r
+    }\r
+    // record which of the input sequences were actually used to generate the\r
+    // url\r
+    boolean[] thismatched = new boolean[maxs];\r
+    int seqsmatched = 0;\r
+    for (int sq = 0; sq < maxs; sq++)\r
+    {\r
+      // initialise flag for match\r
+      thismatched[sq] = false;\r
+      String[] thematches = new String[rgxs.length];\r
+      for (pass = 0; pass < rgxs.length; pass++)\r
+      {\r
+        thematches[pass] = ""; // initialise - in case there are no more\r
+        // matches.\r
+        // if a regex is provided, then it must match for all sequences in all\r
+        // tokens for it to be considered.\r
+        if (idseq[pass].length <= sq)\r
+        {\r
+          // no more replacement strings to try for this token\r
+          continue;\r
+        }\r
+        if (rgxs[pass] != null)\r
+        {\r
+          com.stevesoft.pat.Regex rg = rgxs[pass];\r
+          int rematchat = 0;\r
+          // concatenate all matches of re in the given string!\r
+          while (rg.searchFrom(idseq[pass][sq], rematchat))\r
+          {\r
+            rematchat = rg.matchedTo();\r
+            thismatched[sq] |= true;\r
+            if (!createFullUrl)\r
+            {\r
+              continue; // don't bother making the URL replacement text.\r
+            }\r
+            // do we take the cartesian products of the substituents ?\r
+            int ns = rg.numSubs();\r
+            if (ns == 0)\r
+            {\r
+              thematches[pass] += rg.stringMatched();// take whole regex\r
+            }\r
+            /*\r
+             * else if (ns==1) { // take only subgroup match return new String[]\r
+             * { rg.stringMatched(1), url_prefix+rg.stringMatched(1)+url_suffix\r
+             * }; }\r
+             */\r
+            // deal with multiple submatch case - for moment we do the simplest\r
+            // - concatenate the matched regions, instead of creating a complete\r
+            // list for each alternate match over all sequences.\r
+            // TODO: specify a 'replace pattern' - next refinement\r
+            else\r
+            {\r
+              // debug\r
+              for (int s = 0; s <= rg.numSubs(); s++)\r
+              {\r
+                System.err.println("Sub " + s + " : " + rg.matchedFrom(s)\r
+                        + " : " + rg.matchedTo(s) + " : '"\r
+                        + rg.stringMatched(s) + "'");\r
+              }\r
+              // try to collate subgroup matches\r
+              StringBuffer subs = new StringBuffer();\r
+              // have to loop through submatches, collating them at top level\r
+              // match\r
+              int s = 0; // 1;\r
+              while (s <= ns)\r
+              {\r
+                if (s + 1 <= ns && rg.matchedTo(s) > -1\r
+                        && rg.matchedTo(s + 1) > -1\r
+                        && rg.matchedTo(s + 1) < rg.matchedTo(s))\r
+                {\r
+                  // s is top level submatch. search for submatches enclosed by\r
+                  // this one\r
+                  int r = s + 1;\r
+                  String rmtch = "";\r
+                  while (r <= ns && rg.matchedTo(r) <= rg.matchedTo(s))\r
+                  {\r
+                    if (rg.matchedFrom(r) > -1)\r
+                    {\r
+                      rmtch += rg.stringMatched(r);\r
+                    }\r
+                    r++;\r
+                  }\r
+                  if (rmtch.length() > 0)\r
+                  {\r
+                    subs.append(rmtch); // simply concatenate\r
+                  }\r
+                  s = r;\r
+                }\r
+                else\r
+                {\r
+                  if (rg.matchedFrom(s) > -1)\r
+                  {\r
+                    subs.append(rg.stringMatched(s)); // concatenate\r
+                  }\r
+                  s++;\r
+                }\r
+              }\r
+              thematches[pass] += subs.toString();\r
+            }\r
+          }\r
+        }\r
+        else\r
+        {\r
+          // are we only supposed to take regex matches ?\r
+          if (!onlyIfMatches)\r
+          {\r
+            thismatched[sq] |= true;\r
+            if (createFullUrl)\r
+            {\r
+            thematches[pass] = idseq[pass][sq]; // take whole string -\r
+            // regardless - probably not a\r
+            // good idea!\r
+            /*\r
+             * TODO: do some boilerplate trimming of the fields to make them\r
+             * sensible e.g. trim off any 'prefix' in the id string (see UrlLink\r
+             * for the below) - pre 2.4 Jalview behaviour if\r
+             * (idstring.indexOf("|") > -1) { idstring =\r
+             * idstring.substring(idstring.lastIndexOf("|") + 1); }\r
+             */\r
+            }\r
+            \r
+          }\r
+        }\r
+      }\r
+\r
+      // check if we are going to add this sequence's results ? all token\r
+      // replacements must be valid for this to happen!\r
+      // (including single value replacements - eg. dataset name)\r
+      if (thismatched[sq])\r
+      {\r
+        if (createFullUrl) {\r
+          for (pass = 0; pass < matched.length; pass++)\r
+          {\r
+          if (idseq[pass].length > 1 && matched[pass].length() > 0)\r
+          {\r
+            matched[pass].append(separators[pass]);\r
+          }\r
+            matched[pass].append(thematches[pass]);\r
+          }\r
+        }\r
+        seqsmatched++;\r
+      }\r
+    }\r
+    // finally, if any sequences matched, then form the URL and return\r
+    if (seqsmatched==0 || (createFullUrl && matched[0].length() == 0))\r
+    {\r
+      // no matches - no url generated\r
+      return null;\r
+    }\r
+    if (!createFullUrl)\r
+    {\r
+      // just return the essential info about what the URL would be generated from\r
+      return new Object[]\r
+                        { new int[]\r
+                        { seqsmatched }, thismatched};\r
+    }\r
+    // otherwise, create the URL completely.\r
+    StringBuffer submiturl = new StringBuffer();\r
+    submiturl.append(url_prefix);\r
+    for (pass = 0; pass < matched.length; pass++)\r
+    {\r
+      submiturl.append(matched[pass]);\r
+      if (url_suffix[pass] != null)\r
+      {\r
+        submiturl.append(url_suffix[pass]);\r
+      }\r
+    }\r
+\r
+    return new Object[]\r
+    { new int[]\r
+    { seqsmatched }, thismatched, matched, new String[]\r
+    { submiturl.toString() } };\r
+  }\r
+\r
+  /**\r
+   * \r
+   * @param urlstub\r
+   * @return number of distinct sequence (id or seuqence) replacements predicted for this stub\r
+   */\r
+  public int getNumberInvolved(Object[] urlstub)\r
+  {\r
+    return ((int[])urlstub[0])[0]; // returns seqsmatched from makeUrlsIf(false,...)\r
+  }\r
+\r
+  /**\r
+   * get token types present in this url as a bitfield indicating presence of each token from tokens (LSB->MSB).\r
+   * @return groupURL class as integer\r
+   */\r
+  public int getGroupURLType()\r
+  {\r
+    int r = 0;\r
+    for (int pass = 0; pass < tokens.length; pass++)\r
+    {\r
+      for (int i = 0; i < mtch.length; i++)\r
+      {\r
+        if (mtch[i].equals(tokens[pass]))\r
+        {\r
+          r += 1 << pass;\r
+        }\r
+      }\r
+    }\r
+    return r;\r
+  }\r
+\r
+  public String toString()\r
+  {\r
+    StringBuffer result = new StringBuffer();\r
+    result.append(label + "|" + url_prefix);\r
+    int r;\r
+    for (r = 0; r < url_suffix.length; r++)\r
+    {\r
+      result.append("$");\r
+      result.append(mtch[r]);\r
+      if (regexReplace[r] != null)\r
+      {\r
+        result.append("=/");\r
+        result.append(regexReplace[r]);\r
+        result.append("/=");\r
+      }\r
+      result.append("$");\r
+      result.append(url_suffix[r]);\r
+    }\r
+    for (r = 0; r < separators.length; r++)\r
+    {\r
+      result.append("|");\r
+      result.append(separators[r]);\r
+    }\r
+    return result.toString();\r
+  }\r
+\r
+  /**\r
+   * report stats about the generated url string given an input set\r
+   * \r
+   * @param ul\r
+   *          the link that produced url (not used by the report)\r
+   * @param idstring\r
+   *          { sequence ids, sequence strings } as returned by formStrings\r
+   * @param url\r
+   *          result of makeUrls, or null if no url was generated\r
+   */\r
+  private static void testUrls(GroupUrlLink ul, String[][] idstring,\r
+          Object[] url)\r
+  {\r
+    if (url == null)\r
+    {\r
+      System.out.println("Created NO urls.");\r
+      return;\r
+    }\r
+    int[] count = (int[]) url[0];\r
+    boolean[] used = (boolean[]) url[1];\r
+    int total = idstring[0].length;\r
+    System.out.println("Created a url from " + count[0] + " out of " + total\r
+            + " sequences.");\r
+    System.out.println("Sequences that did not match:");\r
+    for (int sq = 0; sq < total; sq++)\r
+    {\r
+      if (!used[sq])\r
+      {\r
+        System.out.println("Seq " + sq + ": " + idstring[0][sq] + "\t: "\r
+                + idstring[1][sq]);\r
+      }\r
+    }\r
+    System.out.println("Sequences that DID match:");\r
+    for (int sq = 0; sq < total; sq++)\r
+    {\r
+      if (used[sq])\r
+      {\r
+        System.out.println("Seq " + sq + ": " + idstring[0][sq] + "\t: "\r
+                + idstring[1][sq]);\r
+      }\r
+    }\r
+    System.out.println("The generated URL:");\r
+    System.out.println(((String[]) url[3])[0]);\r
+  }\r
+\r
+  public static void main(String argv[])\r
+  {\r
+    String[] links = new String[]\r
+    {\r
+        "EnVision2|IDS|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=Enfin%20Default%20Workflow&datasetName=linkInDatasetFromJalview&input=$SEQUENCEIDS$&inputType=0|,",\r
+        "EnVision2|Seqs|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=Enfin%20Default%20Workflow&datasetName=linkInDatasetFromJalview&input=$SEQUENCES$&inputType=1|,",\r
+        "EnVision2|IDS|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=Enfin%20Default%20Workflow&datasetName=$DATASETID$&input=$SEQUENCEIDS$&inputType=0|,",\r
+        "EnVision2|Seqs|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=Enfin%20Default%20Workflow&datasetName=$DATASETID$&input=$SEQUENCES$&inputType=1|,",\r
+        "EnVision2|IDS|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=$SEQUENCEIDS$&datasetName=linkInDatasetFromJalview&input=$SEQUENCEIDS$&inputType=0|,",\r
+        "EnVision2|Seqs|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=$SEQUENCEIDS$&datasetName=$DATASETID$&input=$SEQUENCES$&inputType=1|,",\r
+        "EnVision2 Seqs|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=Default&datasetName=JalviewSeqs$DATASETID$&input=$SEQUENCES=/([a-zA-Z]+)/=$&inputType=1|,",\r
+        "EnVision2 Seqs|http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?workflow=Default&datasetName=JalviewSeqs$DATASETID$&input=$SEQUENCES=/[A-Za-z]+/=$&inputType=1|,"\r
+    /*\r
+     * http://www.ebi.ac.uk/enfin-srv/envision2/pages/linkin.jsf?input=P38389,P38398\r
+     * &inputType=0&workflow=Enfin%20Default%20Workflow&datasetName=\r
+     * linkInDatasetFromPRIDE\r
+     */\r
+    };\r
+\r
+    SequenceI[] seqs = new SequenceI[]\r
+    { new Sequence("StupidLabel:gi|9234|pdb|102L|A",\r
+            "asdiasdpasdpadpwpadasdpaspdw"), };\r
+    String[][] seqsandids = formStrings(seqs);\r
+    for (int i = 0; i < links.length; i++)\r
+    {\r
+      GroupUrlLink ul = new GroupUrlLink(links[i]);\r
+      if (ul.isValid())\r
+      {\r
+        System.out.println("\n\n\n");\r
+        System.out.println("Link " + i + " " + links[i] + " : "\r
+                + ul.toString());\r
+        System.out.println(" pref : " + ul.getUrl_prefix());\r
+        System.out.println(" IdReplace : " + ul.getIDRegexReplace());\r
+        System.out.println(" SeqReplace : " + ul.getSeqRegexReplace());\r
+        System.out.println(" Suffixes : " + ul.getUrl_suffix());\r
+\r
+        System.out\r
+                .println("<insert input id and sequence strings here> Without onlyIfMatches:");\r
+        Object[] urls = ul.makeUrls(seqsandids[0], seqsandids[1],\r
+                "mydataset", false);\r
+        testUrls(ul, seqsandids, urls);\r
+        System.out\r
+                .println("<insert input id and sequence strings here> With onlyIfMatches set:");\r
+        urls = ul.makeUrls(seqsandids[0], seqsandids[1], "mydataset", true);\r
+        testUrls(ul, seqsandids, urls);\r
+      }\r
+      else\r
+      {\r
+        System.err.println("Invalid URLLink : " + links[i] + " : "\r
+                + ul.getInvalidMessage());\r
+      }\r
+    }\r
+  }\r
+\r
+  /**\r
+   * covenience method to generate the id and sequence string vector from a set\r
+   * of seuqences using each sequence's getName() and getSequenceAsString()\r
+   * method\r
+   * \r
+   * @param seqs\r
+   * @return String[][] {{sequence ids},{sequence strings}}\r
+   */\r
+  public static String[][] formStrings(SequenceI[] seqs)\r
+  {\r
+    String[][] idset = new String[2][seqs.length];\r
+    for (int i = 0; i < seqs.length; i++)\r
+    {\r
+      idset[0][i] = seqs[i].getName();\r
+      idset[1][i] = seqs[i].getSequenceAsString();\r
+    }\r
+    return idset;\r
+  }\r
+\r
+  public void setLabel(String newlabel)\r
+  {\r
+    this.label = newlabel;\r
+  }\r
+\r
+\r
+}\r
author	jprocter <Jim Procter>
	Fri, 26 Mar 2010 14:31:59 +0000 (14:31 +0000)
committer	jprocter <Jim Procter>
	Fri, 26 Mar 2010 14:31:59 +0000 (14:31 +0000)