Mac binaries
[jabaws.git] / website / archive / binaries / mac / src / muscle / objscoreda.cpp
diff --git a/website/archive/binaries/mac/src/muscle/objscoreda.cpp b/website/archive/binaries/mac/src/muscle/objscoreda.cpp
new file mode 100644 (file)
index 0000000..3f2978e
--- /dev/null
@@ -0,0 +1,289 @@
+#include "muscle.h"\r
+#include "msa.h"\r
+#include "profile.h"\r
+#include "objscore.h"\r
+\r
+#if    DOUBLE_AFFINE\r
+\r
+#define TRACE                  0\r
+#define TEST_SPFAST            0\r
+\r
+static SCORE GapPenalty(unsigned uLength, bool Term, SCORE g, SCORE e)\r
+       {\r
+       //if (Term)\r
+       //      {\r
+       //      switch (g_TermGap)\r
+       //              {\r
+       //      case TERMGAP_Full:\r
+       //              return g + (uLength - 1)*e;\r
+\r
+       //      case TERMGAP_Half:\r
+       //              return g/2 + (uLength - 1)*e;\r
+\r
+       //      case TERMGAP_Ext:\r
+       //              return uLength*e;\r
+       //              }\r
+       //      Quit("Bad termgap");\r
+       //      }\r
+       //else\r
+       //      return g + (uLength - 1)*e;\r
+       //return MINUS_INFINITY;\r
+       return g + (uLength - 1)*e;\r
+       }\r
+\r
+static SCORE GapPenalty(unsigned uLength, bool Term)\r
+       {\r
+       SCORE s1 = GapPenalty(uLength, Term, g_scoreGapOpen, g_scoreGapExtend);\r
+#if    DOUBLE_AFFINE\r
+       SCORE s2 = GapPenalty(uLength, Term, g_scoreGapOpen2, g_scoreGapExtend2);\r
+       if (s1 > s2)\r
+               return s1;\r
+       return s2;\r
+#else\r
+       return s1;\r
+#endif\r
+       }\r
+\r
+static const MSA *g_ptrMSA1;\r
+static const MSA *g_ptrMSA2;\r
+static unsigned g_uSeqIndex1;\r
+static unsigned g_uSeqIndex2;\r
+\r
+static void LogGap(unsigned uStart, unsigned uEnd, unsigned uGapLength,\r
+  bool bNTerm, bool bCTerm)\r
+       {\r
+       Log("%16.16s  ", "");\r
+       for (unsigned i = 0; i < uStart; ++i)\r
+               Log(" ");\r
+       unsigned uMyLength = 0;\r
+       for (unsigned i = uStart; i <= uEnd; ++i)\r
+               {\r
+               bool bGap1 = g_ptrMSA1->IsGap(g_uSeqIndex1, i);\r
+               bool bGap2 = g_ptrMSA2->IsGap(g_uSeqIndex2, i);\r
+               if (!bGap1 && !bGap2)\r
+                       Quit("Error -- neither gapping");\r
+               if (bGap1 && bGap2)\r
+                       Log(".");\r
+               else\r
+                       {\r
+                       ++uMyLength;\r
+                       Log("-");\r
+                       }\r
+               }\r
+       SCORE s = GapPenalty(uGapLength, bNTerm || bCTerm);\r
+       Log(" L=%d N%d C%d s=%.3g", uGapLength, bNTerm, bCTerm, s);\r
+       Log("\n");\r
+       if (uMyLength != uGapLength)\r
+               Quit("Lengths differ");\r
+\r
+       }\r
+\r
+static SCORE ScoreSeqPair(const MSA &msa1, unsigned uSeqIndex1,\r
+  const MSA &msa2, unsigned uSeqIndex2, SCORE *ptrLetters, SCORE *ptrGaps)\r
+       {\r
+       g_ptrMSA1 = &msa1;\r
+       g_ptrMSA2 = &msa2;\r
+       g_uSeqIndex1 = uSeqIndex1;\r
+       g_uSeqIndex2 = uSeqIndex2;\r
+\r
+       const unsigned uColCount = msa1.GetColCount();\r
+       const unsigned uColCount2 = msa2.GetColCount();\r
+       if (uColCount != uColCount2)\r
+               Quit("ScoreSeqPair, different lengths");\r
+\r
+#if    TRACE\r
+       Log("ScoreSeqPair\n");\r
+       Log("%16.16s  ", msa1.GetSeqName(uSeqIndex1));\r
+       for (unsigned i = 0; i < uColCount; ++i)\r
+               Log("%c", msa1.GetChar(uSeqIndex1, i));\r
+       Log("\n");\r
+       Log("%16.16s  ", msa2.GetSeqName(uSeqIndex2));\r
+       for (unsigned i = 0; i < uColCount; ++i)\r
+               Log("%c", msa1.GetChar(uSeqIndex2, i));\r
+       Log("\n");\r
+#endif\r
+\r
+       SCORE scoreTotal = 0;\r
+\r
+// Substitution scores\r
+       unsigned uFirstLetter1 = uInsane;\r
+       unsigned uFirstLetter2 = uInsane;\r
+       unsigned uLastLetter1 = uInsane;\r
+       unsigned uLastLetter2 = uInsane;\r
+       for (unsigned uColIndex = 0; uColIndex < uColCount; ++uColIndex)\r
+               {\r
+               bool bGap1 = msa1.IsGap(uSeqIndex1, uColIndex);\r
+               bool bGap2 = msa2.IsGap(uSeqIndex2, uColIndex);\r
+               bool bWildcard1 = msa1.IsWildcard(uSeqIndex1, uColIndex);\r
+               bool bWildcard2 = msa2.IsWildcard(uSeqIndex2, uColIndex);\r
+\r
+               if (!bGap1)\r
+                       {\r
+                       if (uInsane == uFirstLetter1)\r
+                               uFirstLetter1 = uColIndex;\r
+                       uLastLetter1 = uColIndex;\r
+                       }\r
+               if (!bGap2)\r
+                       {\r
+                       if (uInsane == uFirstLetter2)\r
+                               uFirstLetter2 = uColIndex;\r
+                       uLastLetter2 = uColIndex;\r
+                       }\r
+\r
+               if (bGap1 || bGap2 || bWildcard1 || bWildcard2)\r
+                       continue;\r
+\r
+               unsigned uLetter1 = msa1.GetLetter(uSeqIndex1, uColIndex);\r
+               unsigned uLetter2 = msa2.GetLetter(uSeqIndex2, uColIndex);\r
+\r
+               SCORE scoreMatch = (*g_ptrScoreMatrix)[uLetter1][uLetter2];\r
+               scoreTotal += scoreMatch;\r
+#if    TRACE\r
+               Log("%c <-> %c = %7.1f  %10.1f\n",\r
+                 msa1.GetChar(uSeqIndex1, uColIndex),\r
+                 msa2.GetChar(uSeqIndex2, uColIndex),\r
+                 scoreMatch,\r
+                 scoreTotal);\r
+#endif\r
+               }\r
+       \r
+       *ptrLetters = scoreTotal;\r
+\r
+// Gap penalties\r
+       unsigned uGapLength = uInsane;\r
+       unsigned uGapStartCol = uInsane;\r
+       bool bGapping1 = false;\r
+       bool bGapping2 = false;\r
+\r
+       for (unsigned uColIndex = 0; uColIndex < uColCount; ++uColIndex)\r
+               {\r
+               bool bGap1 = msa1.IsGap(uSeqIndex1, uColIndex);\r
+               bool bGap2 = msa2.IsGap(uSeqIndex2, uColIndex);\r
+\r
+               if (bGap1 && bGap2)\r
+                       continue;\r
+\r
+               if (bGapping1)\r
+                       {\r
+                       if (bGap1)\r
+                               ++uGapLength;\r
+                       else\r
+                               {\r
+                               bGapping1 = false;\r
+                               bool bNTerm = (uFirstLetter2 == uGapStartCol);\r
+                               bool bCTerm = (uLastLetter2 + 1 == uColIndex);\r
+                               SCORE scoreGap = GapPenalty(uGapLength, bNTerm || bCTerm);\r
+                               scoreTotal += scoreGap;\r
+#if    TRACE\r
+                               LogGap(uGapStartCol, uColIndex - 1, uGapLength, bNTerm, bCTerm);\r
+                               Log("GAP         %7.1f  %10.1f\n",\r
+                                 scoreGap,\r
+                                 scoreTotal);\r
+#endif\r
+                               }\r
+                       continue;\r
+                       }\r
+               else\r
+                       {\r
+                       if (bGap1)\r
+                               {\r
+                               uGapStartCol = uColIndex;\r
+                               bGapping1 = true;\r
+                               uGapLength = 1;\r
+                               continue;\r
+                               }\r
+                       }\r
+\r
+               if (bGapping2)\r
+                       {\r
+                       if (bGap2)\r
+                               ++uGapLength;\r
+                       else\r
+                               {\r
+                               bGapping2 = false;\r
+                               bool bNTerm = (uFirstLetter1 == uGapStartCol);\r
+                               bool bCTerm = (uLastLetter1 + 1 == uColIndex);\r
+                               SCORE scoreGap = GapPenalty(uGapLength, bNTerm || bCTerm);\r
+                               scoreTotal += scoreGap;\r
+#if    TRACE\r
+                               LogGap(uGapStartCol, uColIndex - 1, uGapLength, bNTerm, bCTerm);\r
+                               Log("GAP         %7.1f  %10.1f\n",\r
+                                 scoreGap,\r
+                                 scoreTotal);\r
+#endif\r
+                               }\r
+                       }\r
+               else\r
+                       {\r
+                       if (bGap2)\r
+                               {\r
+                               uGapStartCol = uColIndex;\r
+                               bGapping2 = true;\r
+                               uGapLength = 1;\r
+                               }\r
+                       }\r
+               }\r
+\r
+       if (bGapping1 || bGapping2)\r
+               {\r
+               SCORE scoreGap = GapPenalty(uGapLength, true);\r
+               scoreTotal += scoreGap;\r
+#if    TRACE\r
+               LogGap(uGapStartCol, uColCount - 1, uGapLength, false, true);\r
+               Log("GAP         %7.1f  %10.1f\n",\r
+                 scoreGap,\r
+                 scoreTotal);\r
+#endif\r
+               }\r
+       *ptrGaps = scoreTotal - *ptrLetters;\r
+       return scoreTotal;\r
+       }\r
+\r
+// The usual sum-of-pairs objective score: sum the score\r
+// of the alignment of each pair of sequences.\r
+SCORE ObjScoreDA(const MSA &msa, SCORE *ptrLetters, SCORE *ptrGaps)\r
+       {\r
+       const unsigned uSeqCount = msa.GetSeqCount();\r
+       SCORE scoreTotal = 0;\r
+       unsigned uPairCount = 0;\r
+#if    TRACE\r
+       msa.LogMe();\r
+       Log("     Score  Weight  Weight       Total\n");\r
+       Log("----------  ------  ------  ----------\n");\r
+#endif\r
+       SCORE TotalLetters = 0;\r
+       SCORE TotalGaps = 0;\r
+       for (unsigned uSeqIndex1 = 0; uSeqIndex1 < uSeqCount; ++uSeqIndex1)\r
+               {\r
+               const WEIGHT w1 = msa.GetSeqWeight(uSeqIndex1);\r
+               for (unsigned uSeqIndex2 = uSeqIndex1 + 1; uSeqIndex2 < uSeqCount; ++uSeqIndex2)\r
+                       {\r
+                       const WEIGHT w2 = msa.GetSeqWeight(uSeqIndex2);\r
+                       const WEIGHT w = w1*w2;\r
+                       SCORE Letters;\r
+                       SCORE Gaps;\r
+                       SCORE scorePair = ScoreSeqPair(msa, uSeqIndex1, msa, uSeqIndex2,\r
+                         &Letters, &Gaps);\r
+                       scoreTotal += w1*w2*scorePair;\r
+                       TotalLetters += w1*w2*Letters;\r
+                       TotalGaps += w1*w2*Gaps;\r
+                       ++uPairCount;\r
+#if    TRACE\r
+                       Log("%10.2f  %6.3f  %6.3f  %10.2f  %d=%s %d=%s\n",\r
+                         scorePair,\r
+                         w1,\r
+                         w2,\r
+                         scorePair*w1*w2,\r
+                         uSeqIndex1,\r
+                         msa.GetSeqName(uSeqIndex1),\r
+                         uSeqIndex2,\r
+                         msa.GetSeqName(uSeqIndex2));\r
+#endif\r
+                       }\r
+               }\r
+       *ptrLetters = TotalLetters;\r
+       *ptrGaps = TotalGaps;\r
+       return scoreTotal;\r
+       }\r
+\r
+#endif // DOUBLE_AFFINE\r