12 #if RND // by D.Mathog
13 static void generateRndSeq( char *seq, int len )
17 *seq++ = (int)( rnd() * n20or4or2 );
24 static void vec_init( Fukusosuu *result, int nlen )
28 result->R = result->I = 0.0;
34 static void vec_init2( Fukusosuu **result, char *seq, double eff, int st, int ed )
37 for( i=st; i<ed; i++ )
38 result[(int)*seq++][i].R += eff;
42 static void seq_vec_2( Fukusosuu *result, double *score, double incr, char *seq )
45 for( ; *seq; result++ )
47 n = amino_n[(int)*seq++];
48 if( n < 20 && n >= 0 ) result->R += incr * score[n];
50 fprintf( stderr, "n=%d, score=%f, inc=%f R=%f\n",n, score[n], incr * score[n], result->R );
55 static void seq_vec_3( Fukusosuu **result, double incr, char *seq )
61 n = amino_n[(int)*seq++];
62 if( n < n20or4or2 && n >= 0 ) result[n][i].R += incr;
66 static void seq_vec_5( Fukusosuu *result, double *score1, double *score2, double incr, char *seq )
69 for( ; *seq; result++ )
71 n = amino_n[(int)*seq++];
72 if( n > 20 ) continue;
73 result->R += incr * score1[n];
74 result->I += incr * score2[n];
76 fprintf( stderr, "n=%d, score=%f, inc=%f R=%f\n",n, score[n], incr * score[n], result->R );
82 static void seq_vec_4( Fukusosuu *result, double incr, char *seq )
85 for( ; *seq; result++ )
100 static void seq_vec( Fukusosuu *result, char query, double incr, char *seq )
107 if( *seq++ == query ) result->R += incr;
110 fprintf( stderr, "i = %d result->R = %f\n", bk-nlen, (result-1)->R );
115 static int checkRepeat( int num, int *cutpos )
122 if( ( tmp = *cutpos++ ) < buf ) return( 1 );
128 static int segcmp( void *ptr1, void *ptr2 )
131 Segment **seg1 = (Segment **)ptr1;
132 Segment **seg2 = (Segment **)ptr2;
134 return( (*seg1)->center - (*seg2)->center );
136 diff = (*seg1)->center - (*seg2)->center;
137 if( diff ) return( diff );
139 diff = (*seg1)->start - (*seg2)->start;
140 if( diff ) return( diff );
142 diff = (*seg1)->end - (*seg2)->end;
143 if( diff ) return( diff );
145 fprintf( stderr, "USE STABLE SORT !!\n" );
153 static void mymergesort( int first, int last, Segment **seg )
156 static int i, j, k, p;
158 static Segment **work = NULL;
162 if( work ) free( work );
163 work = (Segment **)calloc( allo / 2 + 1, sizeof( Segment *) );
168 middle = ( first + last ) / 2;
169 mymergesort( first, middle, seg );
170 mymergesort( middle+1, last, seg );
172 for( i=first; i<=middle; i++ ) work[p++] = seg[i];
173 i = middle + 1; j = 0; k = first;
174 while( i <= last && j < p )
176 if( work[j]->center <= seg[i]->center )
177 seg[k++] = work[j++];
181 while( j < p ) seg[k++] = work[j++];
186 double Fgetlag( char **seq1, char **seq2,
187 double *eff1, double *eff2,
188 int clus1, int clus2,
192 int nlen, nlen2, nlen4;
193 static int crossscoresize = 0;
194 static char **tmpseq1 = NULL;
195 static char **tmpseq2 = NULL;
196 static char **tmpptr1 = NULL;
197 static char **tmpptr2 = NULL;
198 static char **tmpres1 = NULL;
199 static char **tmpres2 = NULL;
200 static char **result1 = NULL;
201 static char **result2 = NULL;
203 static char **rndseq1 = NULL;
204 static char **rndseq2 = NULL;
206 static Fukusosuu **seqVector1 = NULL;
207 static Fukusosuu **seqVector2 = NULL;
208 static Fukusosuu **naiseki = NULL;
209 static Fukusosuu *naisekiNoWa = NULL;
210 static double *soukan = NULL;
211 static double **crossscore = NULL;
213 static int *kouho = NULL;
214 static Segment *segment = NULL;
215 static Segment *segment1 = NULL;
216 static Segment *segment2 = NULL;
217 static Segment **sortedseg1 = NULL;
218 static Segment **sortedseg2 = NULL;
219 static int *cut1 = NULL;
220 static int *cut2 = NULL;
221 static int localalloclen = 0;
229 len1 = strlen( seq1[0] );
230 len2 = strlen( seq2[0] );
231 nlentmp = MAX( len1, len2 );
234 while( nlentmp >= nlen ) nlen <<= 1;
236 fprintf( stderr, "### nlen = %d\n", nlen );
239 nlen2 = nlen/2; nlen4 = nlen2 / 2;
242 fprintf( stderr, "len1 = %d, len2 = %d\n", len1, len2 );
243 fprintf( stderr, "nlentmp = %d, nlen = %d\n", nlentmp, nlen );
248 kouho = AllocateIntVec( NKOUHO );
249 cut1 = AllocateIntVec( MAXSEG );
250 cut2 = AllocateIntVec( MAXSEG );
251 tmpptr1 = AllocateCharMtx( njob, 0 );
252 tmpptr2 = AllocateCharMtx( njob, 0 );
253 result1 = AllocateCharMtx( njob, alloclen );
254 result2 = AllocateCharMtx( njob, alloclen );
255 tmpres1 = AllocateCharMtx( njob, alloclen );
256 tmpres2 = AllocateCharMtx( njob, alloclen );
257 // crossscore = AllocateDoubleMtx( MAXSEG, MAXSEG );
258 segment = (Segment *)calloc( MAXSEG, sizeof( Segment ) );
259 segment1 = (Segment *)calloc( MAXSEG, sizeof( Segment ) );
260 segment2 = (Segment *)calloc( MAXSEG, sizeof( Segment ) );
261 sortedseg1 = (Segment **)calloc( MAXSEG, sizeof( Segment * ) );
262 sortedseg2 = (Segment **)calloc( MAXSEG, sizeof( Segment * ) );
263 if( !( segment && segment1 && segment2 && sortedseg1 && sortedseg2 ) )
264 ErrorExit( "Allocation error\n" );
266 if ( scoremtx == -1 ) n20or4or2 = 4;
267 else if( fftscore == 1 ) n20or4or2 = 2;
270 if( localalloclen < nlen )
275 FreeFukusosuuMtx ( seqVector1 );
276 FreeFukusosuuMtx ( seqVector2 );
277 FreeFukusosuuVec( naisekiNoWa );
278 FreeFukusosuuMtx( naiseki );
279 FreeDoubleVec( soukan );
280 FreeCharMtx( tmpseq1 );
281 FreeCharMtx( tmpseq2 );
284 FreeCharMtx( rndseq1 );
285 FreeCharMtx( rndseq2 );
290 tmpseq1 = AllocateCharMtx( njob, nlen );
291 tmpseq2 = AllocateCharMtx( njob, nlen );
292 naisekiNoWa = AllocateFukusosuuVec( nlen );
293 naiseki = AllocateFukusosuuMtx( n20or4or2, nlen );
294 seqVector1 = AllocateFukusosuuMtx( n20or4or2+1, nlen+1 );
295 seqVector2 = AllocateFukusosuuMtx( n20or4or2+1, nlen+1 );
296 soukan = AllocateDoubleVec( nlen+1 );
299 rndseq1 = AllocateCharMtx( njob, nlen );
300 rndseq2 = AllocateCharMtx( njob, nlen );
301 for( i=0; i<njob; i++ )
303 generateRndSeq( rndseq1[i], nlen );
304 generateRndSeq( rndseq2[i], nlen );
307 localalloclen = nlen;
310 for( j=0; j<clus1; j++ ) strcpy( tmpseq1[j], seq1[j] );
311 for( j=0; j<clus2; j++ ) strcpy( tmpseq2[j], seq2[j] );
314 fftfp = fopen( "input_of_Falign", "w" );
315 fprintf( fftfp, "nlen = %d\n", nlen );
316 fprintf( fftfp, "seq1: ( %d sequences ) \n", clus1 );
317 for( i=0; i<clus1; i++ )
318 fprintf( fftfp, "%s\n", seq1[i] );
319 fprintf( fftfp, "seq2: ( %d sequences ) \n", clus2 );
320 for( i=0; i<clus2; i++ )
321 fprintf( fftfp, "%s\n", seq2[i] );
323 system( "less input_of_Falign < /dev/tty > /dev/tty" );
326 if( fftkeika ) fprintf( stderr, " FFT ... " );
328 for( j=0; j<n20or4or2; j++ ) vec_init( seqVector1[j], nlen );
329 if( fftscore && scoremtx != -1 )
331 for( i=0; i<clus1; i++ )
333 seq_vec_2( seqVector1[0], polarity, eff1[i], tmpseq1[i] );
334 seq_vec_2( seqVector1[1], volume, eff1[i], tmpseq1[i] );
340 for( i=0; i<clus1; i++ ) for( j=0; j<n20or4or2; j++ )
341 seq_vec( seqVector1[j], amino[j], eff1[i], tmpseq1[i] );
343 for( i=0; i<clus1; i++ )
344 seq_vec_3( seqVector1, eff1[i], tmpseq1[i] );
348 for( i=0; i<clus1; i++ )
350 vec_init2( seqVector1, rndseq1[i], eff1[i], len1, nlen );
354 fftfp = fopen( "seqVec", "w" );
355 fprintf( fftfp, "before transform\n" );
356 for( k=0; k<n20or4or2; k++ )
358 fprintf( fftfp, "nlen=%d\n", nlen );
359 fprintf( fftfp, "%c\n", amino[k] );
360 for( l=0; l<nlen; l++ )
361 fprintf( fftfp, "%f %f\n", seqVector1[k][l].R, seqVector1[k][l].I );
364 system( "less seqVec < /dev/tty > /dev/tty" );
367 for( j=0; j<n20or4or2; j++ ) vec_init( seqVector2[j], nlen );
368 if( fftscore && scoremtx != -1 )
370 for( i=0; i<clus2; i++ )
372 seq_vec_2( seqVector2[0], polarity, eff2[i], tmpseq2[i] );
373 seq_vec_2( seqVector2[1], volume, eff2[i], tmpseq2[i] );
379 for( i=0; i<clus2; i++ ) for( j=0; j<n20or4or2; j++ )
380 seq_vec( seqVector2[j], amino[j], eff2[i], tmpseq2[i] );
382 for( i=0; i<clus2; i++ )
383 seq_vec_3( seqVector2, eff2[i], tmpseq2[i] );
387 for( i=0; i<clus2; i++ )
389 vec_init2( seqVector2, rndseq2[i], eff2[i], len2, nlen );
394 fftfp = fopen( "seqVec2", "w" );
395 fprintf( fftfp, "before fft\n" );
396 for( k=0; k<n20or4or2; k++ )
398 fprintf( fftfp, "%c\n", amino[k] );
399 for( l=0; l<nlen; l++ )
400 fprintf( fftfp, "%f %f\n", seqVector2[k][l].R, seqVector2[k][l].I );
403 system( "less seqVec2 < /dev/tty > /dev/tty" );
406 for( j=0; j<n20or4or2; j++ )
408 fft( nlen, seqVector2[j], (j==0) );
409 fft( nlen, seqVector1[j], 0 );
412 fftfp = fopen( "seqVec2", "w" );
413 fprintf( fftfp, "#after fft\n" );
414 for( k=0; k<n20or4or2; k++ )
416 fprintf( fftfp, "#%c\n", amino[k] );
417 for( l=0; l<nlen; l++ )
418 fprintf( fftfp, "%f %f\n", seqVector2[k][l].R, seqVector2[k][l].I );
421 system( "less seqVec2 < /dev/tty > /dev/tty" );
424 for( k=0; k<n20or4or2; k++ )
426 for( l=0; l<nlen; l++ )
427 calcNaiseki( naiseki[k]+l, seqVector1[k]+l, seqVector2[k]+l );
429 for( l=0; l<nlen; l++ )
431 naisekiNoWa[l].R = 0.0;
432 naisekiNoWa[l].I = 0.0;
433 for( k=0; k<n20or4or2; k++ )
435 naisekiNoWa[l].R += naiseki[k][l].R;
436 naisekiNoWa[l].I += naiseki[k][l].I;
441 fftfp = fopen( "naisekiNoWa", "w" );
442 fprintf( fftfp, "#Before fft\n" );
443 for( l=0; l<nlen; l++ )
444 fprintf( fftfp, "%d %f %f\n", l, naisekiNoWa[l].R, naisekiNoWa[l].I );
446 system( "less naisekiNoWa < /dev/tty > /dev/tty " );
449 fft( -nlen, naisekiNoWa, 0 );
451 for( m=0; m<=nlen2; m++ )
452 soukan[m] = naisekiNoWa[nlen2-m].R;
453 for( m=nlen2+1; m<nlen; m++ )
454 soukan[m] = naisekiNoWa[nlen+nlen2-m].R;
457 fftfp = fopen( "naisekiNoWa", "w" );
458 fprintf( fftfp, "#After fft\n" );
459 for( l=0; l<nlen; l++ )
460 fprintf( fftfp, "%d %f\n", l, naisekiNoWa[l].R );
462 fftfp = fopen( "list.plot", "w" );
463 fprintf( fftfp, "plot 'naisekiNoWa'\npause -1" );
465 system( "/usr/bin/gnuplot list.plot &" );
468 fprintf( stderr, "frt write start\n" );
469 fftfp = fopen( "frt", "w" );
470 for( l=0; l<nlen; l++ )
471 fprintf( fftfp, "%d %f\n", l-nlen2, soukan[l] );
473 system( "less frt < /dev/tty > /dev/tty" );
475 fftfp = fopen( "list.plot", "w" );
476 fprintf( fftfp, "plot 'frt'\n pause +1" );
478 system( "/usr/bin/gnuplot list.plot" );
483 getKouho( kouho, NKOUHO, soukan, nlen );
486 for( i=0; i<NKOUHO; i++ )
488 fprintf( stdout, "kouho[%d] = %d\n", i, kouho[i] );
493 fprintf( stderr, "Searching anchors ... " );
501 fftfp = fopen( "cand", "w" );
505 for( k=0; k<NKOUHO; k++ )
509 zurasu2( lag, clus1, clus2, seq1, seq2, tmpptr1, tmpptr2 );
511 fftfp = fopen( "cand", "a" );
512 fprintf( fftfp, ">Candidate No.%d lag = %d\n", k+1, lag );
513 fprintf( fftfp, "%s\n", tmpptr1[0] );
514 fprintf( fftfp, ">Candidate No.%d lag = %d\n", k+1, lag );
515 fprintf( fftfp, "%s\n", tmpptr2[0] );
516 fprintf( fftfp, ">\n", k+1, lag );
519 tmpint = alignableReagion( clus1, clus2, tmpptr1, tmpptr2, eff1, eff2, segment+count );
521 if( count+tmpint > MAXSEG -3 ) ErrorExit( "TOO MANY SEGMENTS.\n" );
524 if( tmpint == 0 ) break; // 060430 iinoka ?
525 while( tmpint-- > 0 )
529 segment1[count].start = segment[count].start ;
530 segment1[count].end = segment[count].end ;
531 segment1[count].center = segment[count].center;
532 segment1[count].score = segment[count].score;
534 segment2[count].start = segment[count].start + lag;
535 segment2[count].end = segment[count].end + lag;
536 segment2[count].center = segment[count].center + lag;
537 segment2[count].score = segment[count].score ;
541 segment1[count].start = segment[count].start - lag;
542 segment1[count].end = segment[count].end - lag;
543 segment1[count].center = segment[count].center - lag;
544 segment1[count].score = segment[count].score ;
546 segment2[count].start = segment[count].start ;
547 segment2[count].end = segment[count].end ;
548 segment2[count].center = segment[count].center;
549 segment2[count].score = segment[count].score ;
552 fprintf( stderr, "Goukaku=%dko\n", tmpint );
553 fprintf( stderr, "in 1 %d\n", segment1[count].center );
554 fprintf( stderr, "in 2 %d\n", segment2[count].center );
556 segment1[count].pair = &segment2[count];
557 segment2[count].pair = &segment1[count];
560 fprintf( stderr, "count=%d\n", count );
566 fprintf( stderr, "done. (%d anchors)\r", count );
568 if( !count && fftNoAnchStop )
569 ErrorExit( "Cannot detect anchor!" );
571 fprintf( stdout, "RESULT before sort:\n" );
572 for( l=0; l<count+1; l++ )
574 fprintf( stdout, "cut[%d]=%d, ", l, segment1[l].center );
575 fprintf( stdout, "%d score = %f\n", segment2[l].center, segment1[l].score );
581 fprintf( stderr, "Aligning anchors ... " );
583 for( i=0; i<count; i++ )
585 sortedseg1[i] = &segment1[i];
586 sortedseg2[i] = &segment2[i];
590 mymergesort( 0, count-1, sortedseg1 );
591 mymergesort( 0, count-1, sortedseg2 );
592 for( i=0; i<count; i++ ) sortedseg1[i]->number = i;
593 for( i=0; i<count; i++ ) sortedseg2[i]->number = i;
595 if( crossscoresize < count+2 )
597 crossscoresize = count+2;
598 fprintf( stderr, "####################################################################################################################################allocating crossscore, size = %d\n", crossscoresize );
599 if( crossscore ) FreeDoubleMtx( crossscore );
600 crossscore = AllocateDoubleMtx( crossscoresize, crossscoresize );
603 for( i=0; i<count+2; i++ ) for( j=0; j<count+2; j++ )
604 crossscore[i][j] = 0.0;
605 for( i=0; i<count; i++ )
607 crossscore[segment1[i].number+1][segment1[i].pair->number+1] = segment1[i].score;
608 cut1[i+1] = sortedseg1[i]->center;
609 cut2[i+1] = sortedseg2[i]->center;
613 fprintf( stderr, "AFTER SORT\n" );
614 for( i=0; i<count; i++ ) fprintf( stderr, "%d, %d\n", segment1[i].start, segment2[i].start );
617 crossscore[0][0] = 10000000.0;
620 crossscore[count+1][count+1] = 10000000.0;
621 cut1[count+1] = len1;
622 cut2[count+1] = len2;
626 blockAlign2( cut1, cut2, sortedseg1, sortedseg2, crossscore, &count );
632 fprintf( stderr, "REPEAT!? \n" );
633 if( fftRepeatStop ) exit( 1 );
637 fprintf( stderr, "done\n" );
638 fprintf( stderr, "done. (%d anchors)\n", count );
643 fftfp = fopen( "fft", "a" );
644 fprintf( fftfp, "RESULT after sort:\n" );
645 for( l=0; l<count; l++ )
647 fprintf( fftfp, "cut[%d]=%d, ", l, segment1[l].center );
648 fprintf( fftfp, "%d\n", segment2[l].center );
654 fftfp = fopen( "fft", "a" );
655 fprintf( fftfp, "RESULT after sort:\n" );
656 for( l=0; l<count; l++ )
658 fprintf( fftfp, "cut : %d %d\n", cut1[l], cut2[l] );
664 fprintf( trap_g, "Devided to %d segments\n", count-1 );
665 fprintf( trap_g, "%d %d forg\n", MIN( clus1, clus2 ), count-1 );
669 for( j=0; j<clus1; j++ ) result1[j][0] = 0;
670 for( j=0; j<clus2; j++ ) result2[j][0] = 0;
671 for( i=0; i<count-1; i++ )
674 fprintf( stderr, "DP %03d / %03d %4d to ", i+1, count-1, totallen );
677 fprintf( stderr, "DP %03d / %03d\r", i+1, count-1 );
680 for( j=0; j<clus1; j++ )
682 strncpy( tmpres1[j], seq1[j]+cut1[i], cut1[i+1]-cut1[i] );
683 tmpres1[j][cut1[i+1]-cut1[i]] = 0;
685 for( j=0; j<clus2; j++ )
687 strncpy( tmpres2[j], seq2[j]+cut2[i], cut2[i+1]-cut2[i] );
688 tmpres2[j][cut2[i+1]-cut2[i]] = 0;
693 Aalign( tmpres1, tmpres2, eff1, eff2, clus1, clus2, alloclen );
696 MSalignmm( tmpres1, tmpres2, eff1, eff2, clus1, clus2, alloclen, NULL, NULL, NULL, NULL );
699 if( clus1 == 1 && clus2 == 1 )
700 G__align11( tmpres1, tmpres2, alloclen );
702 A__align( tmpres1, tmpres2, eff1, eff2, clus1, clus2, alloclen, NULL, &dumfl, NULL, NULL, NULL, NULL );
705 if( clus1 == 1 && clus2 == 1 )
706 G__align11( tmpres1, tmpres2, alloclen );
708 H__align( tmpres1, tmpres2, eff1, eff2, clus1, clus2, alloclen, NULL, &dumfl, NULL, NULL, NULL, NULL );
711 if( clus1 == 1 && clus2 == 1 )
712 G__align11( tmpres1, tmpres2, alloclen );
714 Q__align( tmpres1, tmpres2, eff1, eff2, clus1, clus2, alloclen, NULL, &dumfl, NULL, NULL, NULL, NULL );
717 fprintf( stderr, "alg = %c\n", alg );
718 ErrorExit( "ERROR IN SOURCE FILE Falign.c" );
722 nlen = strlen( tmpres1[0] );
723 if( totallen + nlen > alloclen ) ErrorExit( "LENGTH OVER in Falign\n " );
724 for( j=0; j<clus1; j++ ) strcat( result1[j], tmpres1[j] );
725 for( j=0; j<clus2; j++ ) strcat( result2[j], tmpres2[j] );
728 fprintf( stderr, "%4d\r", totallen );
729 fprintf( stderr, "\n\n" );
730 for( j=0; j<clus1; j++ )
732 fprintf( stderr, "%s\n", tmpres1[j] );
734 fprintf( stderr, "-------\n" );
735 for( j=0; j<clus2; j++ )
737 fprintf( stderr, "%s\n", tmpres2[j] );
742 fprintf( stderr, "DP ... done \n" );
745 for( j=0; j<clus1; j++ ) strcpy( seq1[j], result1[j] );
746 for( j=0; j<clus2; j++ ) strcpy( seq2[j], result2[j] );
748 for( j=0; j<clus1; j++ )
750 fprintf( stderr, "%s\n", result1[j] );
752 fprintf( stderr, "- - - - - - - - - - -\n" );
753 for( j=0; j<clus2; j++ )
755 fprintf( stderr, "%s\n", result2[j] );
764 float Falign( char **seq1, char **seq2,
765 double *eff1, double *eff2,
766 int clus1, int clus2,
767 int alloclen, int *fftlog )
769 int i, j, k, l, m, maxk;
770 int nlen, nlen2, nlen4;
771 static int prevalloclen = 0;
772 static int crossscoresize = 0;
773 static char **tmpseq1 = NULL;
774 static char **tmpseq2 = NULL;
775 static char **tmpptr1 = NULL;
776 static char **tmpptr2 = NULL;
777 static char **tmpres1 = NULL;
778 static char **tmpres2 = NULL;
779 static char **result1 = NULL;
780 static char **result2 = NULL;
782 static char **rndseq1 = NULL;
783 static char **rndseq2 = NULL;
785 static Fukusosuu **seqVector1 = NULL;
786 static Fukusosuu **seqVector2 = NULL;
787 static Fukusosuu **naiseki = NULL;
788 static Fukusosuu *naisekiNoWa = NULL;
789 static double *soukan = NULL;
790 static double **crossscore = NULL;
792 static int *kouho = NULL;
793 static Segment *segment = NULL;
794 static Segment *segment1 = NULL;
795 static Segment *segment2 = NULL;
796 static Segment **sortedseg1 = NULL;
797 static Segment **sortedseg2 = NULL;
798 static int *cut1 = NULL;
799 static int *cut2 = NULL;
800 static char *sgap1, *egap1, *sgap2, *egap2;
801 static int localalloclen = 0;
811 len1 = strlen( seq1[0] );
812 len2 = strlen( seq2[0] );
813 nlentmp = MAX( len1, len2 );
816 while( nlentmp >= nlen ) nlen <<= 1;
818 fprintf( stderr, "### nlen = %d\n", nlen );
821 nlen2 = nlen/2; nlen4 = nlen2 / 2;
824 fprintf( stderr, "len1 = %d, len2 = %d\n", len1, len2 );
825 fprintf( stderr, "nlentmp = %d, nlen = %d\n", nlentmp, nlen );
828 if( prevalloclen != alloclen ) // Falign_noudp mo kaeru
832 FreeCharMtx( result1 );
833 FreeCharMtx( result2 );
834 FreeCharMtx( tmpres1 );
835 FreeCharMtx( tmpres2 );
837 // fprintf( stderr, "\n\n\nreallocating ...\n" );
838 result1 = AllocateCharMtx( njob, alloclen );
839 result2 = AllocateCharMtx( njob, alloclen );
840 tmpres1 = AllocateCharMtx( njob, alloclen );
841 tmpres2 = AllocateCharMtx( njob, alloclen );
842 prevalloclen = alloclen;
846 sgap1 = AllocateCharVec( njob );
847 egap1 = AllocateCharVec( njob );
848 sgap2 = AllocateCharVec( njob );
849 egap2 = AllocateCharVec( njob );
850 kouho = AllocateIntVec( NKOUHO );
851 cut1 = AllocateIntVec( MAXSEG );
852 cut2 = AllocateIntVec( MAXSEG );
853 tmpptr1 = AllocateCharMtx( njob, 0 );
854 tmpptr2 = AllocateCharMtx( njob, 0 );
855 // crossscore = AllocateDoubleMtx( MAXSEG, MAXSEG );
856 segment = (Segment *)calloc( MAXSEG, sizeof( Segment ) );
857 segment1 = (Segment *)calloc( MAXSEG, sizeof( Segment ) );
858 segment2 = (Segment *)calloc( MAXSEG, sizeof( Segment ) );
859 sortedseg1 = (Segment **)calloc( MAXSEG, sizeof( Segment * ) );
860 sortedseg2 = (Segment **)calloc( MAXSEG, sizeof( Segment * ) );
861 if( !( segment && segment1 && segment2 && sortedseg1 && sortedseg2 ) )
862 ErrorExit( "Allocation error\n" );
864 if ( scoremtx == -1 ) n20or4or2 = 1;
865 else if( fftscore ) n20or4or2 = 1;
868 if( localalloclen < nlen )
873 if( !kobetsubunkatsu )
875 FreeFukusosuuMtx ( seqVector1 );
876 FreeFukusosuuMtx ( seqVector2 );
877 FreeFukusosuuVec( naisekiNoWa );
878 FreeFukusosuuMtx( naiseki );
879 FreeDoubleVec( soukan );
881 FreeCharMtx( tmpseq1 );
882 FreeCharMtx( tmpseq2 );
885 FreeCharMtx( rndseq1 );
886 FreeCharMtx( rndseq2 );
890 tmpseq1 = AllocateCharMtx( njob, nlen );
891 tmpseq2 = AllocateCharMtx( njob, nlen );
892 if( !kobetsubunkatsu )
894 naisekiNoWa = AllocateFukusosuuVec( nlen );
895 naiseki = AllocateFukusosuuMtx( n20or4or2, nlen );
896 seqVector1 = AllocateFukusosuuMtx( n20or4or2+1, nlen+1 );
897 seqVector2 = AllocateFukusosuuMtx( n20or4or2+1, nlen+1 );
898 soukan = AllocateDoubleVec( nlen+1 );
901 rndseq1 = AllocateCharMtx( njob, nlen );
902 rndseq2 = AllocateCharMtx( njob, nlen );
903 for( i=0; i<njob; i++ )
905 generateRndSeq( rndseq1[i], nlen );
906 generateRndSeq( rndseq2[i], nlen );
909 localalloclen = nlen;
912 for( j=0; j<clus1; j++ ) strcpy( tmpseq1[j], seq1[j] );
913 for( j=0; j<clus2; j++ ) strcpy( tmpseq2[j], seq2[j] );
916 fftfp = fopen( "input_of_Falign", "w" );
917 fprintf( fftfp, "nlen = %d\n", nlen );
918 fprintf( fftfp, "seq1: ( %d sequences ) \n", clus1 );
919 for( i=0; i<clus1; i++ )
920 fprintf( fftfp, "%s\n", seq1[i] );
921 fprintf( fftfp, "seq2: ( %d sequences ) \n", clus2 );
922 for( i=0; i<clus2; i++ )
923 fprintf( fftfp, "%s\n", seq2[i] );
925 system( "less input_of_Falign < /dev/tty > /dev/tty" );
927 if( !kobetsubunkatsu )
929 if( fftkeika ) fprintf( stderr, " FFT ... " );
931 for( j=0; j<n20or4or2; j++ ) vec_init( seqVector1[j], nlen );
932 if( fftscore && scoremtx != -1 )
934 for( i=0; i<clus1; i++ )
937 seq_vec_5( seqVector1[0], polarity, volume, eff1[i], tmpseq1[i] );
939 seq_vec_2( seqVector1[0], polarity, eff1[i], tmpseq1[i] );
940 seq_vec_2( seqVector1[1], volume, eff1[i], tmpseq1[i] );
947 for( i=0; i<clus1; i++ ) for( j=0; j<n20or4or2; j++ )
948 seq_vec( seqVector1[j], amino[j], eff1[i], tmpseq1[i] );
950 for( i=0; i<clus1; i++ )
951 seq_vec_3( seqVector1, eff1[i], tmpseq1[i] );
955 for( i=0; i<clus1; i++ )
957 vec_init2( seqVector1, rndseq1[i], eff1[i], len1, nlen );
961 fftfp = fopen( "seqVec", "w" );
962 fprintf( fftfp, "before transform\n" );
963 for( k=0; k<n20or4or2; k++ )
965 fprintf( fftfp, "nlen=%d\n", nlen );
966 fprintf( fftfp, "%c\n", amino[k] );
967 for( l=0; l<nlen; l++ )
968 fprintf( fftfp, "%f %f\n", seqVector1[k][l].R, seqVector1[k][l].I );
971 system( "less seqVec < /dev/tty > /dev/tty" );
974 for( j=0; j<n20or4or2; j++ ) vec_init( seqVector2[j], nlen );
975 if( fftscore && scoremtx != -1 )
977 for( i=0; i<clus2; i++ )
980 seq_vec_5( seqVector2[0], polarity, volume, eff2[i], tmpseq2[i] );
982 seq_vec_2( seqVector2[0], polarity, eff2[i], tmpseq2[i] );
983 seq_vec_2( seqVector2[1], volume, eff2[i], tmpseq2[i] );
990 for( i=0; i<clus2; i++ ) for( j=0; j<n20or4or2; j++ )
991 seq_vec( seqVector2[j], amino[j], eff2[i], tmpseq2[i] );
993 for( i=0; i<clus2; i++ )
994 seq_vec_3( seqVector2, eff2[i], tmpseq2[i] );
998 for( i=0; i<clus2; i++ )
1000 vec_init2( seqVector2, rndseq2[i], eff2[i], len2, nlen );
1005 fftfp = fopen( "seqVec2", "w" );
1006 fprintf( fftfp, "before fft\n" );
1007 for( k=0; k<n20or4or2; k++ )
1009 fprintf( fftfp, "%c\n", amino[k] );
1010 for( l=0; l<nlen; l++ )
1011 fprintf( fftfp, "%f %f\n", seqVector2[k][l].R, seqVector2[k][l].I );
1014 system( "less seqVec2 < /dev/tty > /dev/tty" );
1017 for( j=0; j<n20or4or2; j++ )
1019 fft( nlen, seqVector2[j], (j==0) );
1020 fft( nlen, seqVector1[j], 0 );
1023 fftfp = fopen( "seqVec2", "w" );
1024 fprintf( fftfp, "#after fft\n" );
1025 for( k=0; k<n20or4or2; k++ )
1027 fprintf( fftfp, "#%c\n", amino[k] );
1028 for( l=0; l<nlen; l++ )
1029 fprintf( fftfp, "%f %f\n", seqVector2[k][l].R, seqVector2[k][l].I );
1032 system( "less seqVec2 < /dev/tty > /dev/tty" );
1035 for( k=0; k<n20or4or2; k++ )
1037 for( l=0; l<nlen; l++ )
1038 calcNaiseki( naiseki[k]+l, seqVector1[k]+l, seqVector2[k]+l );
1040 for( l=0; l<nlen; l++ )
1042 naisekiNoWa[l].R = 0.0;
1043 naisekiNoWa[l].I = 0.0;
1044 for( k=0; k<n20or4or2; k++ )
1046 naisekiNoWa[l].R += naiseki[k][l].R;
1047 naisekiNoWa[l].I += naiseki[k][l].I;
1052 fftfp = fopen( "naisekiNoWa", "w" );
1053 fprintf( fftfp, "#Before fft\n" );
1054 for( l=0; l<nlen; l++ )
1055 fprintf( fftfp, "%d %f %f\n", l, naisekiNoWa[l].R, naisekiNoWa[l].I );
1057 system( "less naisekiNoWa < /dev/tty > /dev/tty " );
1060 fft( -nlen, naisekiNoWa, 0 );
1062 for( m=0; m<=nlen2; m++ )
1063 soukan[m] = naisekiNoWa[nlen2-m].R;
1064 for( m=nlen2+1; m<nlen; m++ )
1065 soukan[m] = naisekiNoWa[nlen+nlen2-m].R;
1068 fftfp = fopen( "naisekiNoWa", "w" );
1069 fprintf( fftfp, "#After fft\n" );
1070 for( l=0; l<nlen; l++ )
1071 fprintf( fftfp, "%d %f\n", l, naisekiNoWa[l].R );
1073 fftfp = fopen( "list.plot", "w" );
1074 fprintf( fftfp, "plot 'naisekiNoWa'\npause -1" );
1076 system( "/usr/bin/gnuplot list.plot &" );
1079 fprintf( stderr, "soukan\n" );
1080 for( l=0; l<nlen; l++ )
1081 fprintf( stderr, "%d %f\n", l-nlen2, soukan[l] );
1083 fftfp = fopen( "list.plot", "w" );
1084 fprintf( fftfp, "plot 'frt'\n pause +1" );
1086 system( "/usr/bin/gnuplot list.plot" );
1091 getKouho( kouho, NKOUHO, soukan, nlen );
1094 for( i=0; i<NKOUHO; i++ )
1096 fprintf( stderr, "kouho[%d] = %d\n", i, kouho[i] );
1102 fprintf( stderr, "Searching anchors ... " );
1110 fftfp = fopen( "cand", "w" );
1113 if( kobetsubunkatsu )
1123 for( k=0; k<maxk; k++ )
1126 if( lag <= -len1 || len2 <= lag ) continue;
1127 zurasu2( lag, clus1, clus2, seq1, seq2, tmpptr1, tmpptr2 );
1129 fftfp = fopen( "cand", "a" );
1130 fprintf( fftfp, ">Candidate No.%d lag = %d\n", k+1, lag );
1131 fprintf( fftfp, "%s\n", tmpptr1[0] );
1132 fprintf( fftfp, ">Candidate No.%d lag = %d\n", k+1, lag );
1133 fprintf( fftfp, "%s\n", tmpptr2[0] );
1134 fprintf( fftfp, ">\n", k+1, lag );
1138 // fprintf( stderr, "lag = %d\n", lag );
1139 tmpint = alignableReagion( clus1, clus2, tmpptr1, tmpptr2, eff1, eff2, segment+count );
1141 // if( lag == -50 ) exit( 1 );
1143 if( count+tmpint > MAXSEG -3 ) ErrorExit( "TOO MANY SEGMENTS.\n" );
1146 if( tmpint == 0 ) break; // 060430 iinoka ?
1147 while( tmpint-- > 0 )
1150 if( segment[count].end - segment[count].start < fftWinSize )
1158 segment1[count].start = segment[count].start ;
1159 segment1[count].end = segment[count].end ;
1160 segment1[count].center = segment[count].center;
1161 segment1[count].score = segment[count].score;
1163 segment2[count].start = segment[count].start + lag;
1164 segment2[count].end = segment[count].end + lag;
1165 segment2[count].center = segment[count].center + lag;
1166 segment2[count].score = segment[count].score ;
1170 segment1[count].start = segment[count].start - lag;
1171 segment1[count].end = segment[count].end - lag;
1172 segment1[count].center = segment[count].center - lag;
1173 segment1[count].score = segment[count].score ;
1175 segment2[count].start = segment[count].start ;
1176 segment2[count].end = segment[count].end ;
1177 segment2[count].center = segment[count].center;
1178 segment2[count].score = segment[count].score ;
1181 fprintf( stderr, "in 1 %d\n", segment1[count].center );
1182 fprintf( stderr, "in 2 %d\n", segment2[count].center );
1184 segment1[count].pair = &segment2[count];
1185 segment2[count].pair = &segment1[count];
1190 if( !kobetsubunkatsu && fftkeika )
1191 fprintf( stderr, "%d anchors found\r", count );
1193 if( !count && fftNoAnchStop )
1194 ErrorExit( "Cannot detect anchor!" );
1196 fprintf( stderr, "RESULT before sort:\n" );
1197 for( l=0; l<count+1; l++ )
1199 fprintf( stderr, "cut[%d]=%d, ", l, segment1[l].center );
1200 fprintf( stderr, "%d score = %f\n", segment2[l].center, segment1[l].score );
1205 fprintf( stderr, "done. (%d anchors)\n", count );
1206 fprintf( stderr, "Aligning anchors ... " );
1208 for( i=0; i<count; i++ )
1210 sortedseg1[i] = &segment1[i];
1211 sortedseg2[i] = &segment2[i];
1214 tmpsort( count, sortedseg1 );
1215 tmpsort( count, sortedseg2 );
1216 qsort( sortedseg1, count, sizeof( Segment * ), segcmp );
1217 qsort( sortedseg2, count, sizeof( Segment * ), segcmp );
1219 mymergesort( 0, count-1, sortedseg1 );
1220 mymergesort( 0, count-1, sortedseg2 );
1222 for( i=0; i<count; i++ ) sortedseg1[i]->number = i;
1223 for( i=0; i<count; i++ ) sortedseg2[i]->number = i;
1226 if( kobetsubunkatsu )
1228 for( i=0; i<count; i++ )
1230 cut1[i+1] = sortedseg1[i]->center;
1231 cut2[i+1] = sortedseg2[i]->center;
1235 cut1[count+1] = len1;
1236 cut2[count+1] = len2;
1241 if( crossscoresize < count+2 )
1243 crossscoresize = count+2;
1245 if( fftkeika ) fprintf( stderr, "######allocating crossscore, size = %d\n", crossscoresize );
1247 if( crossscore ) FreeDoubleMtx( crossscore );
1248 crossscore = AllocateDoubleMtx( crossscoresize, crossscoresize );
1250 for( i=0; i<count+2; i++ ) for( j=0; j<count+2; j++ )
1251 crossscore[i][j] = 0.0;
1252 for( i=0; i<count; i++ )
1254 crossscore[segment1[i].number+1][segment1[i].pair->number+1] = segment1[i].score;
1255 cut1[i+1] = sortedseg1[i]->center;
1256 cut2[i+1] = sortedseg2[i]->center;
1260 fprintf( stderr, "AFTER SORT\n" );
1261 for( i=0; i<count+1; i++ ) fprintf( stderr, "%d, %d\n", cut1[i], cut2[i] );
1262 fprintf( stderr, "crossscore = \n" );
1263 for( i=0; i<count+1; i++ )
1265 for( j=0; j<count+1; j++ )
1266 fprintf( stderr, "%.0f ", crossscore[i][j] );
1267 fprintf( stderr, "\n" );
1271 crossscore[0][0] = 10000000.0;
1274 crossscore[count+1][count+1] = 10000000.0;
1275 cut1[count+1] = len1;
1276 cut2[count+1] = len2;
1280 blockAlign2( cut1, cut2, sortedseg1, sortedseg2, crossscore, &count );
1282 // if( count-count0 )
1283 // fprintf( stderr, "%d unused anchors\n", count0-count );
1285 if( !kobetsubunkatsu && fftkeika )
1286 fprintf( stderr, "%d anchors found\n", count );
1289 if( count0 > count )
1292 fprintf( stderr, "\7 REPEAT!? \n" );
1294 fprintf( stderr, "REPEAT!? \n" );
1296 if( fftRepeatStop ) exit( 1 );
1299 else fprintf( stderr, "done\n" );
1305 fftfp = fopen( "fft", "a" );
1306 fprintf( fftfp, "RESULT after sort:\n" );
1307 for( l=0; l<count; l++ )
1309 fprintf( fftfp, "cut[%d]=%d, ", l, segment1[l].center );
1310 fprintf( fftfp, "%d\n", segment2[l].center );
1316 fprintf( stderr, "RESULT after blckalign:\n" );
1317 for( l=0; l<count+1; l++ )
1319 fprintf( stderr, "cut : %d %d\n", cut1[l], cut2[l] );
1324 fprintf( trap_g, "Devided to %d segments\n", count-1 );
1325 fprintf( trap_g, "%d %d forg\n", MIN( clus1, clus2 ), count-1 );
1329 for( j=0; j<clus1; j++ ) result1[j][0] = 0;
1330 for( j=0; j<clus2; j++ ) result2[j][0] = 0;
1333 for( i=0; i<count-1; i++ )
1337 if( cut1[i] ) // chuui
1339 // getkyokaigap( sgap1, tmpres1, nlen-1, clus1 );
1340 // getkyokaigap( sgap2, tmpres2, nlen-1, clus2 );
1341 getkyokaigap( sgap1, tmpres1, nlen-1, clus1 );
1342 getkyokaigap( sgap2, tmpres2, nlen-1, clus2 );
1346 for( j=0; j<clus1; j++ ) sgap1[j] = 'o';
1347 for( j=0; j<clus2; j++ ) sgap2[j] = 'o';
1349 if( cut1[i+1] != len1 ) // chuui
1351 getkyokaigap( egap1, seq1, cut1[i+1], clus1 );
1352 getkyokaigap( egap2, seq2, cut2[i+1], clus2 );
1356 for( j=0; j<clus1; j++ ) egap1[j] = 'o';
1357 for( j=0; j<clus2; j++ ) egap2[j] = 'o';
1361 fprintf( stderr, "kyokkaigap1(%d)=", cut1[i]-1 );
1362 for( j=0; j<clus1; j++ )
1363 fprintf( stderr, "%c", sgap1[j] );
1364 fprintf( stderr, "=kyokkaigap1-start\n" );
1367 fprintf( stderr, "kyokkaigap2(%d)=", cut2[i]-1 );
1368 for( j=0; j<clus2; j++ )
1369 fprintf( stderr, "%c", sgap2[j] );
1370 fprintf( stderr, "=kyokkaigap2-start\n" );
1373 fprintf( stderr, "kyokkaigap1(%d)=", cut1[i]-1 );
1374 for( j=0; j<clus1; j++ )
1375 fprintf( stderr, "%c", egap1[j] );
1376 fprintf( stderr, "=kyokkaigap1-end\n" );
1379 fprintf( stderr, "kyokkaigap2(%d)=", cut2[i]-1 );
1380 for( j=0; j<clus2; j++ )
1381 fprintf( stderr, "%c", egap2[j] );
1382 fprintf( stderr, "=kyokkaigap2-end\n" );
1387 fprintf( stderr, "DP %03d / %03d %4d to ", i+1, count-1, totallen );
1390 fprintf( stderr, "DP %03d / %03d\r", i+1, count-1 );
1393 for( j=0; j<clus1; j++ )
1395 strncpy( tmpres1[j], seq1[j]+cut1[i], cut1[i+1]-cut1[i] );
1396 tmpres1[j][cut1[i+1]-cut1[i]] = 0;
1398 if( kobetsubunkatsu && fftkeika ) commongappick( clus1, tmpres1 ); //dvtditr
\e$B$K8F$P$l$?$H$-
\e(B fftkeika=1
1399 // if( kobetsubunkatsu ) commongappick( clus1, tmpres1 );
1400 for( j=0; j<clus2; j++ )
1402 strncpy( tmpres2[j], seq2[j]+cut2[i], cut2[i+1]-cut2[i] );
1403 tmpres2[j][cut2[i+1]-cut2[i]] = 0;
1405 if( kobetsubunkatsu && fftkeika ) commongappick( clus2, tmpres2 ); //dvtditr
\e$B$K8F$P$l$?$H$-
\e(B fftkeika=1
1406 // if( kobetsubunkatsu ) commongappick( clus2, tmpres2 );
1410 fprintf( stderr, "Not supported\n" );
1414 fprintf( stderr, "i=%d, before alignment", i );
1415 fprintf( stderr, "%4d\n", totallen );
1416 fprintf( stderr, "\n\n" );
1417 for( j=0; j<clus1; j++ )
1419 fprintf( stderr, "%s\n", tmpres1[j] );
1421 fprintf( stderr, "-------\n" );
1422 for( j=0; j<clus2; j++ )
1424 fprintf( stderr, "%s\n", tmpres2[j] );
1429 fprintf( stdout, "writing input\n" );
1430 for( j=0; j<clus1; j++ )
1432 fprintf( stdout, ">%d of GROUP1\n", j );
1433 fprintf( stdout, "%s\n", tmpres1[j] );
1435 for( j=0; j<clus2; j++ )
1437 fprintf( stdout, ">%d of GROUP2\n", j );
1438 fprintf( stdout, "%s\n", tmpres2[j] );
1445 totalscore += Aalign( tmpres1, tmpres2, eff1, eff2, clus1, clus2, alloclen );
1448 totalscore += MSalignmm( tmpres1, tmpres2, eff1, eff2, clus1, clus2, alloclen, sgap1, sgap2, egap1, egap2 );
1451 if( clus1 == 1 && clus2 == 1 )
1453 totalscore += G__align11( tmpres1, tmpres2, alloclen );
1456 totalscore += A__align( tmpres1, tmpres2, eff1, eff2, clus1, clus2, alloclen, NULL, &dumfl, sgap1, sgap2, egap1, egap2 );
1459 if( clus1 == 1 && clus2 == 1 )
1461 totalscore += G__align11( tmpres1, tmpres2, alloclen );
1464 totalscore += H__align( tmpres1, tmpres2, eff1, eff2, clus1, clus2, alloclen, NULL, &dumfl, sgap1, sgap2, egap1, egap2 );
1467 if( clus1 == 1 && clus2 == 1 )
1469 totalscore += G__align11( tmpres1, tmpres2, alloclen );
1472 totalscore += Q__align( tmpres1, tmpres2, eff1, eff2, clus1, clus2, alloclen, NULL, &dumfl, sgap1, sgap2, egap1, egap2 );
1475 fprintf( stderr, "alg = %c\n", alg );
1476 ErrorExit( "ERROR IN SOURCE FILE Falign.c" );
1480 nlen = strlen( tmpres1[0] );
1481 if( totallen + nlen > alloclen )
1483 fprintf( stderr, "totallen=%d + nlen=%d > alloclen = %d\n", totallen, nlen, alloclen );
1484 ErrorExit( "LENGTH OVER in Falign\n " );
1486 for( j=0; j<clus1; j++ ) strcat( result1[j], tmpres1[j] );
1487 for( j=0; j<clus2; j++ ) strcat( result2[j], tmpres2[j] );
1490 fprintf( stderr, "i=%d", i );
1491 fprintf( stderr, "%4d\n", totallen );
1492 fprintf( stderr, "\n\n" );
1493 for( j=0; j<clus1; j++ )
1495 fprintf( stderr, "%s\n", tmpres1[j] );
1497 fprintf( stderr, "-------\n" );
1498 for( j=0; j<clus2; j++ )
1500 fprintf( stderr, "%s\n", tmpres2[j] );
1505 fprintf( stderr, "DP ... done \n" );
1508 for( j=0; j<clus1; j++ ) strcpy( seq1[j], result1[j] );
1509 for( j=0; j<clus2; j++ ) strcpy( seq2[j], result2[j] );
1511 for( j=0; j<clus1; j++ )
1513 fprintf( stderr, "%s\n", result1[j] );
1515 fprintf( stderr, "- - - - - - - - - - -\n" );
1516 for( j=0; j<clus2; j++ )
1518 fprintf( stderr, "%s\n", result2[j] );
1521 return( totalscore );
1532 float Falign_udpari_long( char **seq1, char **seq2,
1533 double *eff1, double *eff2,
1534 int clus1, int clus2,
1535 int alloclen, int *fftlog )
1537 int i, j, k, l, m, maxk;
1538 int nlen, nlen2, nlen4;
1539 static int prevalloclen = 0;
1540 static int crossscoresize = 0;
1541 static char **tmpseq1 = NULL;
1542 static char **tmpseq2 = NULL;
1543 static char **tmpptr1 = NULL;
1544 static char **tmpptr2 = NULL;
1545 static char **tmpres1 = NULL;
1546 static char **tmpres2 = NULL;
1547 static char **result1 = NULL;
1548 static char **result2 = NULL;
1550 static char **rndseq1 = NULL;
1551 static char **rndseq2 = NULL;
1553 static Fukusosuu **seqVector1 = NULL;
1554 static Fukusosuu **seqVector2 = NULL;
1555 static Fukusosuu **naiseki = NULL;
1556 static Fukusosuu *naisekiNoWa = NULL;
1557 static double *soukan = NULL;
1558 static double **crossscore = NULL;
1560 static int *kouho = NULL;
1561 static Segment *segment = NULL;
1562 static Segment *segment1 = NULL;
1563 static Segment *segment2 = NULL;
1564 static Segment **sortedseg1 = NULL;
1565 static Segment **sortedseg2 = NULL;
1566 static int *cut1 = NULL;
1567 static int *cut2 = NULL;
1568 static char *sgap1, *egap1, *sgap2, *egap2;
1569 static int localalloclen = 0;
1577 // float dumfl = 0.0;
1580 len1 = strlen( seq1[0] );
1581 len2 = strlen( seq2[0] );
1582 nlentmp = MAX( len1, len2 );
1585 while( nlentmp >= nlen ) nlen <<= 1;
1587 fprintf( stderr, "### nlen = %d\n", nlen );
1590 nlen2 = nlen/2; nlen4 = nlen2 / 2;
1593 fprintf( stderr, "len1 = %d, len2 = %d\n", len1, len2 );
1594 fprintf( stderr, "nlentmp = %d, nlen = %d\n", nlentmp, nlen );
1597 if( prevalloclen != alloclen ) // Falign_noudp mo kaeru
1601 FreeCharMtx( result1 );
1602 FreeCharMtx( result2 );
1603 FreeCharMtx( tmpres1 );
1604 FreeCharMtx( tmpres2 );
1606 // fprintf( stderr, "\n\n\nreallocating ...\n" );
1607 result1 = AllocateCharMtx( njob, alloclen );
1608 result2 = AllocateCharMtx( njob, alloclen );
1609 tmpres1 = AllocateCharMtx( njob, alloclen );
1610 tmpres2 = AllocateCharMtx( njob, alloclen );
1611 prevalloclen = alloclen;
1614 if( !localalloclen )
1616 sgap1 = AllocateCharVec( njob );
1617 egap1 = AllocateCharVec( njob );
1618 sgap2 = AllocateCharVec( njob );
1619 egap2 = AllocateCharVec( njob );
1620 kouho = AllocateIntVec( NKOUHO_LONG );
1621 cut1 = AllocateIntVec( MAXSEG );
1622 cut2 = AllocateIntVec( MAXSEG );
1623 tmpptr1 = AllocateCharMtx( njob, 0 );
1624 tmpptr2 = AllocateCharMtx( njob, 0 );
1625 segment = (Segment *)calloc( MAXSEG, sizeof( Segment ) );
1626 segment1 = (Segment *)calloc( MAXSEG, sizeof( Segment ) );
1627 segment2 = (Segment *)calloc( MAXSEG, sizeof( Segment ) );
1628 sortedseg1 = (Segment **)calloc( MAXSEG, sizeof( Segment * ) );
1629 sortedseg2 = (Segment **)calloc( MAXSEG, sizeof( Segment * ) );
1630 if( !( segment && segment1 && segment2 && sortedseg1 && sortedseg2 ) )
1631 ErrorExit( "Allocation error\n" );
1633 if ( scoremtx == -1 ) n20or4or2 = 1;
1634 else if( fftscore ) n20or4or2 = 1;
1635 else n20or4or2 = 20;
1637 if( localalloclen < nlen )
1642 if( !kobetsubunkatsu )
1644 FreeFukusosuuMtx ( seqVector1 );
1645 FreeFukusosuuMtx ( seqVector2 );
1646 FreeFukusosuuVec( naisekiNoWa );
1647 FreeFukusosuuMtx( naiseki );
1648 FreeDoubleVec( soukan );
1650 FreeCharMtx( tmpseq1 );
1651 FreeCharMtx( tmpseq2 );
1654 FreeCharMtx( rndseq1 );
1655 FreeCharMtx( rndseq2 );
1660 tmpseq1 = AllocateCharMtx( njob, nlen );
1661 tmpseq2 = AllocateCharMtx( njob, nlen );
1662 if( !kobetsubunkatsu )
1664 naisekiNoWa = AllocateFukusosuuVec( nlen );
1665 naiseki = AllocateFukusosuuMtx( n20or4or2, nlen );
1666 seqVector1 = AllocateFukusosuuMtx( n20or4or2, nlen+1 );
1667 seqVector2 = AllocateFukusosuuMtx( n20or4or2, nlen+1 );
1668 soukan = AllocateDoubleVec( nlen+1 );
1671 rndseq1 = AllocateCharMtx( njob, nlen );
1672 rndseq2 = AllocateCharMtx( njob, nlen );
1673 for( i=0; i<njob; i++ )
1675 generateRndSeq( rndseq1[i], nlen );
1676 generateRndSeq( rndseq2[i], nlen );
1679 localalloclen = nlen;
1682 for( j=0; j<clus1; j++ ) strcpy( tmpseq1[j], seq1[j] );
1683 for( j=0; j<clus2; j++ ) strcpy( tmpseq2[j], seq2[j] );
1686 fftfp = fopen( "input_of_Falign", "w" );
1687 fprintf( fftfp, "nlen = %d\n", nlen );
1688 fprintf( fftfp, "seq1: ( %d sequences ) \n", clus1 );
1689 for( i=0; i<clus1; i++ )
1690 fprintf( fftfp, "%s\n", seq1[i] );
1691 fprintf( fftfp, "seq2: ( %d sequences ) \n", clus2 );
1692 for( i=0; i<clus2; i++ )
1693 fprintf( fftfp, "%s\n", seq2[i] );
1695 system( "less input_of_Falign < /dev/tty > /dev/tty" );
1697 if( !kobetsubunkatsu )
1699 fprintf( stderr, " FFT ... " );
1701 for( j=0; j<n20or4or2; j++ ) vec_init( seqVector1[j], nlen );
1702 if( scoremtx == -1 )
1704 for( i=0; i<clus1; i++ )
1705 seq_vec_4( seqVector1[0], eff1[i], tmpseq1[i] );
1709 for( i=0; i<clus1; i++ )
1712 seq_vec_2( seqVector1[0], polarity, eff1[i], tmpseq1[i] );
1713 seq_vec_2( seqVector1[1], volume, eff1[i], tmpseq1[i] );
1715 seq_vec_5( seqVector1[0], polarity, volume, eff1[i], tmpseq1[i] );
1721 for( i=0; i<clus1; i++ )
1722 seq_vec_3( seqVector1, eff1[i], tmpseq1[i] );
1725 for( i=0; i<clus1; i++ )
1727 vec_init2( seqVector1, rndseq1[i], eff1[i], len1, nlen );
1731 fftfp = fopen( "seqVec", "w" );
1732 fprintf( fftfp, "before transform\n" );
1733 for( k=0; k<n20or4or2; k++ )
1735 fprintf( fftfp, "nlen=%d\n", nlen );
1736 fprintf( fftfp, "%c\n", amino[k] );
1737 for( l=0; l<nlen; l++ )
1738 fprintf( fftfp, "%f %f\n", seqVector1[k][l].R, seqVector1[k][l].I );
1741 system( "less seqVec < /dev/tty > /dev/tty" );
1744 for( j=0; j<n20or4or2; j++ ) vec_init( seqVector2[j], nlen );
1745 if( scoremtx == -1 )
1747 for( i=0; i<clus2; i++ )
1748 seq_vec_4( seqVector2[0], eff2[i], tmpseq2[i] );
1752 for( i=0; i<clus2; i++ )
1755 seq_vec_2( seqVector2[0], polarity, eff2[i], tmpseq2[i] );
1756 seq_vec_2( seqVector2[1], volume, eff2[i], tmpseq2[i] );
1758 seq_vec_5( seqVector2[0], polarity, volume, eff2[i], tmpseq2[i] );
1764 for( i=0; i<clus2; i++ )
1765 seq_vec_3( seqVector2, eff2[i], tmpseq2[i] );
1768 for( i=0; i<clus2; i++ )
1770 vec_init2( seqVector2, rndseq2[i], eff2[i], len2, nlen );
1775 fftfp = fopen( "seqVec2", "w" );
1776 fprintf( fftfp, "before fft\n" );
1777 for( k=0; k<n20or4or2; k++ )
1779 fprintf( fftfp, "%c\n", amino[k] );
1780 for( l=0; l<nlen; l++ )
1781 fprintf( fftfp, "%f %f\n", seqVector2[k][l].R, seqVector2[k][l].I );
1784 system( "less seqVec2 < /dev/tty > /dev/tty" );
1787 for( j=0; j<n20or4or2; j++ )
1789 fft( nlen, seqVector2[j], (j==0) );
1790 fft( nlen, seqVector1[j], 0 );
1793 fftfp = fopen( "seqVec2", "w" );
1794 fprintf( fftfp, "#after fft\n" );
1795 for( k=0; k<n20or4or2; k++ )
1797 fprintf( fftfp, "#%c\n", amino[k] );
1798 for( l=0; l<nlen; l++ )
1799 fprintf( fftfp, "%f %f\n", seqVector2[k][l].R, seqVector2[k][l].I );
1802 system( "less seqVec2 < /dev/tty > /dev/tty" );
1805 for( k=0; k<n20or4or2; k++ )
1807 for( l=0; l<nlen; l++ )
1808 calcNaiseki( naiseki[k]+l, seqVector1[k]+l, seqVector2[k]+l );
1810 for( l=0; l<nlen; l++ )
1812 naisekiNoWa[l].R = 0.0;
1813 naisekiNoWa[l].I = 0.0;
1814 for( k=0; k<n20or4or2; k++ )
1816 naisekiNoWa[l].R += naiseki[k][l].R;
1817 naisekiNoWa[l].I += naiseki[k][l].I;
1822 fftfp = fopen( "naisekiNoWa", "w" );
1823 fprintf( fftfp, "#Before fft\n" );
1824 for( l=0; l<nlen; l++ )
1825 fprintf( fftfp, "%d %f %f\n", l, naisekiNoWa[l].R, naisekiNoWa[l].I );
1827 system( "less naisekiNoWa < /dev/tty > /dev/tty " );
1830 fft( -nlen, naisekiNoWa, 0 );
1832 for( m=0; m<=nlen2; m++ )
1833 soukan[m] = naisekiNoWa[nlen2-m].R;
1834 for( m=nlen2+1; m<nlen; m++ )
1835 soukan[m] = naisekiNoWa[nlen+nlen2-m].R;
1838 fftfp = fopen( "naisekiNoWa", "w" );
1839 fprintf( fftfp, "#After fft\n" );
1840 for( l=0; l<nlen; l++ )
1841 fprintf( fftfp, "%d %f\n", l, naisekiNoWa[l].R );
1843 fftfp = fopen( "list.plot", "w" );
1844 fprintf( fftfp, "plot 'naisekiNoWa'\npause -1" );
1846 system( "/usr/bin/gnuplot list.plot &" );
1849 fprintf( stderr, "soukan\n" );
1850 for( l=0; l<nlen; l++ )
1851 fprintf( stderr, "%d %f\n", l-nlen2, soukan[l] );
1853 fftfp = fopen( "list.plot", "w" );
1854 fprintf( fftfp, "plot 'frt'\n pause +1" );
1856 system( "/usr/bin/gnuplot list.plot" );
1861 nkouho = getKouho( kouho, NKOUHO_LONG, soukan, nlen );
1864 for( i=0; i<nkouho; i++ )
1866 fprintf( stderr, "kouho[%d] = %d\n", i, kouho[i] );
1872 fprintf( stderr, "Searching anchors ... " );
1880 fftfp = fopen( "cand", "w" );
1883 if( kobetsubunkatsu )
1893 for( k=0; k<maxk; k++ )
1896 if( lag <= -len1 || len2 <= lag ) continue;
1897 // fprintf( stderr, "k=%d, lag=%d\n", k, lag );
1898 zurasu2( lag, clus1, clus2, seq1, seq2, tmpptr1, tmpptr2 );
1900 fftfp = fopen( "cand", "a" );
1901 fprintf( fftfp, ">Candidate No.%d lag = %d\n", k+1, lag );
1902 fprintf( fftfp, "%s\n", tmpptr1[0] );
1903 fprintf( fftfp, ">Candidate No.%d lag = %d\n", k+1, lag );
1904 fprintf( fftfp, "%s\n", tmpptr2[0] );
1905 fprintf( fftfp, ">\n", k+1, lag );
1909 // fprintf( stderr, "lag = %d\n", lag );
1910 tmpint = alignableReagion( clus1, clus2, tmpptr1, tmpptr2, eff1, eff2, segment+count );
1911 // fprintf( stderr, "lag = %d, %d found\n", lag, tmpint );
1913 // if( lag == -50 ) exit( 1 );
1915 if( count+tmpint > MAXSEG -3 ) ErrorExit( "TOO MANY SEGMENTS.\n" );
1917 // fprintf( stderr, "##### k=%d / %d\n", k, maxk );
1918 // if( tmpint == 0 ) break; // 060430 iinoka ? // 090530 yameta
1919 while( tmpint-- > 0 )
1922 if( segment[count].end - segment[count].start < fftWinSize )
1930 segment1[count].start = segment[count].start ;
1931 segment1[count].end = segment[count].end ;
1932 segment1[count].center = segment[count].center;
1933 segment1[count].score = segment[count].score;
1935 segment2[count].start = segment[count].start + lag;
1936 segment2[count].end = segment[count].end + lag;
1937 segment2[count].center = segment[count].center + lag;
1938 segment2[count].score = segment[count].score ;
1942 segment1[count].start = segment[count].start - lag;
1943 segment1[count].end = segment[count].end - lag;
1944 segment1[count].center = segment[count].center - lag;
1945 segment1[count].score = segment[count].score ;
1947 segment2[count].start = segment[count].start ;
1948 segment2[count].end = segment[count].end ;
1949 segment2[count].center = segment[count].center;
1950 segment2[count].score = segment[count].score ;
1953 fprintf( stderr, "##### k=%d / %d\n", k, maxk );
1954 fprintf( stderr, "anchor %d, score = %f\n", count, segment1[count].score );
1955 fprintf( stderr, "in 1 %d\n", segment1[count].center );
1956 fprintf( stderr, "in 2 %d\n", segment2[count].center );
1958 segment1[count].pair = &segment2[count];
1959 segment2[count].pair = &segment1[count];
1962 fprintf( stderr, "count=%d\n", count );
1967 if( !kobetsubunkatsu )
1968 fprintf( stderr, "done. (%d anchors) ", count );
1970 if( !count && fftNoAnchStop )
1971 ErrorExit( "Cannot detect anchor!" );
1973 fprintf( stderr, "RESULT before sort:\n" );
1974 for( l=0; l<count+1; l++ )
1976 fprintf( stderr, "cut[%d]=%d, ", l, segment1[l].center );
1977 fprintf( stderr, "%d score = %f\n", segment2[l].center, segment1[l].score );
1981 for( i=0; i<count; i++ )
1983 sortedseg1[i] = &segment1[i];
1984 sortedseg2[i] = &segment2[i];
1987 tmpsort( count, sortedseg1 );
1988 tmpsort( count, sortedseg2 );
1989 qsort( sortedseg1, count, sizeof( Segment * ), segcmp );
1990 qsort( sortedseg2, count, sizeof( Segment * ), segcmp );
1992 mymergesort( 0, count-1, sortedseg1 );
1993 mymergesort( 0, count-1, sortedseg2 );
1995 for( i=0; i<count; i++ ) sortedseg1[i]->number = i;
1996 for( i=0; i<count; i++ ) sortedseg2[i]->number = i;
2000 if( kobetsubunkatsu )
2002 for( i=0; i<count; i++ )
2004 cut1[i+1] = sortedseg1[i]->center;
2005 cut2[i+1] = sortedseg2[i]->center;
2009 cut1[count+1] = len1;
2010 cut2[count+1] = len2;
2018 if( crossscoresize < count+2 )
2020 crossscoresize = count+2;
2022 if( fftkeika ) fprintf( stderr, "######allocating crossscore, size = %d\n", crossscoresize );
2024 if( crossscore ) FreeDoubleMtx( crossscore );
2025 crossscore = AllocateDoubleMtx( crossscoresize, crossscoresize );
2027 for( i=0; i<count+2; i++ ) for( j=0; j<count+2; j++ )
2028 crossscore[i][j] = 0.0;
2029 for( i=0; i<count; i++ )
2031 crossscore[segment1[i].number+1][segment1[i].pair->number+1] = segment1[i].score;
2032 cut1[i+1] = sortedseg1[i]->center;
2033 cut2[i+1] = sortedseg2[i]->center;
2037 fprintf( stderr, "AFTER SORT\n" );
2038 for( i=0; i<count+1; i++ ) fprintf( stderr, "%d, %d\n", cut1[i], cut2[i] );
2039 fprintf( stderr, "crossscore = \n" );
2040 for( i=0; i<count+1; i++ )
2042 for( j=0; j<count+1; j++ )
2043 fprintf( stderr, "%.0f ", crossscore[i][j] );
2044 fprintf( stderr, "\n" );
2048 crossscore[0][0] = 10000000.0;
2051 crossscore[count+1][count+1] = 10000000.0;
2052 cut1[count+1] = len1;
2053 cut2[count+1] = len2;
2057 // fprintf( stderr, "\n\n\ncalling blockAlign2\n\n\n\n" );
2058 blockAlign2( cut1, cut2, sortedseg1, sortedseg2, crossscore, &count );
2060 // if( count-count0 )
2061 // fprintf( stderr, "%d unused anchors\n", count0-count );
2063 if( !kobetsubunkatsu && fftkeika )
2064 fprintf( stderr, "%d anchors found\n", count );
2067 if( count0 > count )
2070 fprintf( stderr, "\7 REPEAT!? \n" );
2072 fprintf( stderr, "REPEAT!? \n" );
2074 if( fftRepeatStop ) exit( 1 );
2077 else fprintf( stderr, "done\n" );
2085 fprintf( stderr, "\nMany anchors were found. The upper-level DP is skipped.\n\n" );
2090 for( i=0; i<count; i++ )
2092 // fprintf( stderr, "i=%d, %d-%d ?\n", i, sortedseg1[i]->center, sortedseg1[i]->pair->center );
2093 if( sortedseg1[i]->center > cut1[count0]
2094 && sortedseg1[i]->pair->center > cut2[count0] )
2097 cut1[count0] = sortedseg1[i]->center;
2098 cut2[count0] = sortedseg1[i]->pair->center;
2102 if( i && sortedseg1[i]->score > sortedseg1[i-1]->score )
2104 if( sortedseg1[i]->center > cut1[count0-1]
2105 && sortedseg1[i]->pair->center > cut2[count0-1] )
2107 cut1[count0] = sortedseg1[i]->center;
2108 cut2[count0] = sortedseg1[i]->pair->center;
2117 // if( count-count0 )
2118 // fprintf( stderr, "%d anchors unused\n", count-count0 );
2119 cut1[count0+1] = len1;
2120 cut2[count0+1] = len2;
2130 fftfp = fopen( "fft", "a" );
2131 fprintf( fftfp, "RESULT after sort:\n" );
2132 for( l=0; l<count; l++ )
2134 fprintf( fftfp, "cut[%d]=%d, ", l, segment1[l].center );
2135 fprintf( fftfp, "%d\n", segment2[l].center );
2141 fprintf( stderr, "RESULT after blckalign:\n" );
2142 for( l=0; l<count+1; l++ )
2144 fprintf( stderr, "cut : %d %d\n", cut1[l], cut2[l] );
2149 fprintf( trap_g, "Devided to %d segments\n", count-1 );
2150 fprintf( trap_g, "%d %d forg\n", MIN( clus1, clus2 ), count-1 );
2154 for( j=0; j<clus1; j++ ) result1[j][0] = 0;
2155 for( j=0; j<clus2; j++ ) result2[j][0] = 0;
2158 for( i=0; i<count-1; i++ )
2164 // getkyokaigap( sgap1, seq1, cut1[i]-1, clus1 );
2165 // getkyokaigap( sgap2, seq2, cut2[i]-1, clus2 );
2166 getkyokaigap( sgap1, tmpres1, nlen-1, clus1 );
2167 getkyokaigap( sgap2, tmpres2, nlen-1, clus2 );
2171 for( j=0; j<clus1; j++ ) sgap1[j] = 'o';
2172 for( j=0; j<clus2; j++ ) sgap2[j] = 'o';
2174 if( cut1[i+1] != len1 )
2176 getkyokaigap( egap1, seq1, cut1[i+1], clus1 );
2177 getkyokaigap( egap2, seq2, cut2[i+1], clus2 );
2181 for( j=0; j<clus1; j++ ) egap1[j] = 'o';
2182 for( j=0; j<clus2; j++ ) egap2[j] = 'o';
2185 fprintf( stderr, "DP %03d / %03d %4d to ", i+1, count-1, totallen );
2188 fprintf( stderr, "DP %05d / %05d \b\b\b\b\b\b\b\b\b\b\b\b\b\b\b\b\b", i+1, count-1 );
2191 for( j=0; j<clus1; j++ )
2193 strncpy( tmpres1[j], seq1[j]+cut1[i], cut1[i+1]-cut1[i] );
2194 tmpres1[j][cut1[i+1]-cut1[i]] = 0;
2196 if( kobetsubunkatsu && fftkeika ) commongappick( clus1, tmpres1 ); //dvtditr
\e$B$K8F$P$l$?$H$-
\e(B fftkeika=1
2197 // if( kobetsubunkatsu ) commongappick( clus1, tmpres1 );
2198 for( j=0; j<clus2; j++ )
2200 // fprintf( stderr, "### cut2[i+1]-cut2[i] = %d\n", cut2[i+1]-cut2[i] );
2201 if( cut2[i+1]-cut2[i] <= 0 )
2202 fprintf( stderr, "### cut2[i+1]=%d, cut2[i]=%d\n", cut2[i+1], cut2[i] );
2203 strncpy( tmpres2[j], seq2[j]+cut2[i], cut2[i+1]-cut2[i] );
2204 tmpres2[j][cut2[i+1]-cut2[i]] = 0;
2206 if( kobetsubunkatsu && fftkeika ) commongappick( clus2, tmpres2 ); //dvtditr
\e$B$K8F$P$l$?$H$-
\e(B fftkeika=1
2207 // if( kobetsubunkatsu ) commongappick( clus2, tmpres2 );
2211 fprintf( stderr, "Not supported\n" );
2215 fprintf( stderr, "i=%d, before alignment", i );
2216 fprintf( stderr, "%4d\n", totallen );
2217 fprintf( stderr, "\n\n" );
2218 for( j=0; j<clus1; j++ )
2220 fprintf( stderr, "%s\n", tmpres1[j] );
2222 fprintf( stderr, "-------\n" );
2223 for( j=0; j<clus2; j++ )
2225 fprintf( stderr, "%s\n", tmpres2[j] );
2230 fprintf( stdout, "writing input\n" );
2231 for( j=0; j<clus1; j++ )
2233 fprintf( stdout, ">%d of GROUP1\n", j );
2234 fprintf( stdout, "%s\n", tmpres1[j] );
2236 for( j=0; j<clus2; j++ )
2238 fprintf( stdout, ">%d of GROUP2\n", j );
2239 fprintf( stdout, "%s\n", tmpres2[j] );
2246 totalscore += MSalignmm( tmpres1, tmpres2, eff1, eff2, clus1, clus2, alloclen, sgap1, sgap2, egap1, egap2 );
2249 fprintf( stderr, "alg = %c\n", alg );
2250 ErrorExit( "ERROR IN SOURCE FILE Falign.c" );
2254 nlen = strlen( tmpres1[0] );
2255 if( totallen + nlen > alloclen )
2257 fprintf( stderr, "totallen=%d + nlen=%d > alloclen = %d\n", totallen, nlen, alloclen );
2258 ErrorExit( "LENGTH OVER in Falign\n " );
2260 for( j=0; j<clus1; j++ ) strcat( result1[j], tmpres1[j] );
2261 for( j=0; j<clus2; j++ ) strcat( result2[j], tmpres2[j] );
2264 fprintf( stderr, "i=%d", i );
2265 fprintf( stderr, "%4d\n", totallen );
2266 fprintf( stderr, "\n\n" );
2267 for( j=0; j<clus1; j++ )
2269 fprintf( stderr, "%s\n", tmpres1[j] );
2271 fprintf( stderr, "-------\n" );
2272 for( j=0; j<clus2; j++ )
2274 fprintf( stderr, "%s\n", tmpres2[j] );
2279 fprintf( stderr, "DP ... done \n" );
2282 for( j=0; j<clus1; j++ ) strcpy( seq1[j], result1[j] );
2283 for( j=0; j<clus2; j++ ) strcpy( seq2[j], result2[j] );
2285 for( j=0; j<clus1; j++ )
2287 fprintf( stderr, "%s\n", result1[j] );
2289 fprintf( stderr, "- - - - - - - - - - -\n" );
2290 for( j=0; j<clus2; j++ )
2292 fprintf( stderr, "%s\n", result2[j] );
2295 return( totalscore );