+++ /dev/null
-/*
- * This file is part of TISEAN
- *
- * Copyright (c) 1998-2007 Rainer Hegger, Holger Kantz, Thomas Schreiber
- *
- * TISEAN is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 2 of the License, or
- * (at your option) any later version.
- *
- * TISEAN is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with TISEAN; if not, write to the Free Software
- * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
- */
-/*Author: Rainer Hegger. Last modified: Mar 11, 2002 */
-#include <stdio.h>
-#include <stdlib.h>
-#include <string.h>
-#include <limits.h>
-#include "routines/tsa.h"
-#include <math.h>
-
-#define WID_STR "Fits a RBF-model to the data"
-
-/* Output file name (-o); main() derives a default when it stays NULL. */
-char *outfile=NULL;
-/* Non-zero while results go to stdout; cleared by -o. */
-char stdo=1;
-/* Set by -L: iterate the fitted model to produce a forecast. */
-char MAKECAST=0;
-/* Input file name as returned by search_datafile(); NULL means stdin. */
-char *infile=NULL;
-/* Non-zero while the center drift step is enabled; cleared by -X. */
-char setdrift=1;
-/* Embedding dimension (-m). */
-int DIM=2;
-/* Embedding delay (-d). */
-int DELAY=1;
-/* Number of RBF centers (-p). */
-int CENTER=10;
-/* Forecast horizon in steps (-s); main() forces 1 when -L is given. */
-int STEP=1;
-/* Column of the input file to read (-c). */
-unsigned int COLUMN=1;
-/* Verbosity bit mask (-V). */
-unsigned int verbosity=0xff;
-/* Number of steps to cast (-L). */
-long CLENGTH=1000;
-/* Number of data points to use (-l). */
-unsigned long LENGTH=ULONG_MAX;
-/* Number of leading points used for the fit (-n). */
-unsigned long INSAMPLE=ULONG_MAX;
-/* Number of input lines to skip (-x). */
-unsigned long exclude=0;
-
-/* The data as returned by get_series() and rescaled in main(). */
-double *series;
-/* CENTER+1 fit coefficients; index 0 is the constant term. */
-double *coefs;
-/* Width parameter used by rbf(); main() sets it from avdistance(). */
-double varianz;
-/* Scale and offset filled in by rescale_data(), used to undo the rescaling. */
-double interval;
-double min;
-/* CENTER rows of DIM coordinates each. */
-double **center;
-
-/*
- * Print the program banner followed by the usage text to stderr and
- * terminate the process with exit status 0.
- *
- * progname  name shown in the usage line (callers pass argv[0])
- */
-void show_options(char *progname)
-{
-  what_i_do(progname,WID_STR);
-
-  fprintf(stderr," Usage: %s [options]\n",progname);
-  fputs(" Options:\n",stderr);
-  fputs("Everything not being a valid option will be interpreted as a"
-        " possible datafile.\nIf no datafile is given stdin is read."
-        " Just - also means stdin\n",stderr);
-
-  /* Lines without a conversion go through fputs; the rest show defaults. */
-  fputs("\t-l # of data to use [default: all from file]\n",stderr);
-  fputs("\t-x # of lines to be ignored [default: 0]\n",stderr);
-  fprintf(stderr,"\t-c column to read [default: %u]\n",COLUMN);
-  fprintf(stderr,"\t-m embedding dimension [default: %d]\n",DIM);
-  fprintf(stderr,"\t-d delay [default: %d]\n",DELAY);
-  fprintf(stderr,"\t-p number of centers [default: %d]\n",CENTER);
-  fputs("\t-X deactivate drift [default: activated]\n",stderr);
-  fprintf(stderr,"\t-s steps to forecast [default: %d]\n",STEP);
-  fputs("\t-n # of points for insample [default: # of data]\n",stderr);
-  fputs("\t-L steps to cast [default: none]\n",stderr);
-  fputs("\t-o output file name [default: 'datafile'.rbf]\n",stderr);
-  fputs("\t-V verbosity level [default: 1]\n\t\t"
-        "0='only panic messages'\n\t\t"
-        "1='+ input/output messages'\n",stderr);
-  fputs("\t-h show these options\n",stderr);
-
-  exit(0);
-}
-
-/*
- * Read the command line options and store their values in the
- * file-scope configuration variables.
- *
- * n   number of entries in `in` (callers pass argc)
- * in  argument vector (callers pass argv)
- *
- * The signed targets (DIM, DELAY, CENTER, STEP, CLENGTH) are read
- * through a temporary whose type matches the conversion specifier and
- * then assigned: handing an int* to "%u" or a long* to "%lu" is a
- * specifier/argument mismatch. A target keeps its previous value when
- * the conversion fails.
- */
-void scan_options(int n,char **in)
-{
-  char *out;
-  unsigned int uval;
-  unsigned long ulval;
-
-  if ((out=check_option(in,n,'l','u')) != NULL)
-    sscanf(out,"%lu",&LENGTH);
-  if ((out=check_option(in,n,'x','u')) != NULL)
-    sscanf(out,"%lu",&exclude);
-  if ((out=check_option(in,n,'c','u')) != NULL)
-    sscanf(out,"%u",&COLUMN);
-  if ((out=check_option(in,n,'m','u')) != NULL) {
-    if (sscanf(out,"%u",&uval) == 1)
-      DIM=(int)uval;
-  }
-  if ((out=check_option(in,n,'d','u')) != NULL) {
-    if (sscanf(out,"%u",&uval) == 1)
-      DELAY=(int)uval;
-  }
-  if ((out=check_option(in,n,'p','u')) != NULL) {
-    if (sscanf(out,"%u",&uval) == 1)
-      CENTER=(int)uval;
-  }
-  if ((out=check_option(in,n,'X','n')) != NULL)
-    setdrift=0;
-  if ((out=check_option(in,n,'s','u')) != NULL) {
-    if (sscanf(out,"%u",&uval) == 1)
-      STEP=(int)uval;
-  }
-  if ((out=check_option(in,n,'V','u')) != NULL)
-    sscanf(out,"%u",&verbosity);
-  if ((out=check_option(in,n,'n','u')) != NULL)
-    sscanf(out,"%lu",&INSAMPLE);
-  if ((out=check_option(in,n,'L','u')) != NULL) {
-    /* Giving -L at all switches forecasting on. */
-    MAKECAST=1;
-    if (sscanf(out,"%lu",&ulval) == 1)
-      CLENGTH=(long)ulval;
-  }
-  if ((out=check_option(in,n,'o','o')) != NULL) {
-    stdo=0;
-    /* An empty argument keeps outfile NULL so main() builds a default. */
-    if (strlen(out) > 0)
-      outfile=out;
-  }
-}
-
-/*
- * Root of the mean squared coordinate difference between centers.
- *
- * Sums the squared differences over every ordered pair of distinct
- * centers and every coordinate, divides by (CENTER-1)*CENTER*DIM and
- * returns the square root.
- */
-double avdistance(void)
-{
-  double total=0.0;
-  int a,b,d;
-
-  for (a=0;a<CENTER;a++) {
-    for (b=0;b<CENTER;b++) {
-      if (a == b)
-        continue;
-      for (d=0;d<DIM;d++)
-        total += sqr(center[a][d]-center[b][d]);
-    }
-  }
-
-  return sqrt(total/(CENTER-1)/CENTER/DIM);
-}
-
-/*
- * Evaluate one basis function: exp(-r/(2*varianz^2)), where r is the
- * squared distance between a delay vector and a center.
- *
- * act  points at the most recent component of the delay vector; the
- *      i-th component is read DELAY*i elements before it
- * cen  the DIM coordinates of the center
- */
-double rbf(double *act,double *cen)
-{
-  const double width=2.0*varianz*varianz;
-  double dist2=0.0;
-  int k;
-
-  for (k=0;k<DIM;k++)
-    dist2 += sqr(act[-k*DELAY]-cen[k]);
-
-  return exp(-dist2/width);
-}
-
-/*
- * Move the centers apart by a fixed number of relaxation sweeps.
- *
- * In each sweep every center accumulates, per coordinate, a term
- * h/(h*h*|h|) from each other center (h being the coordinate
- * difference). The resulting vector is scaled to length `stride` and
- * added to the center, coordinate by coordinate, wherever the new
- * value stays strictly inside (-0.1, 1.1). Centers are updated in
- * place, so later centers in a sweep see the moved earlier ones.
- *
- * NOTE(review): two centers sharing a coordinate give h == 0 and a
- * 0/0 term; presumably the resulting non-finite step fails both range
- * tests and the center stays put -- confirm this is intended.
- */
-void drift(void)
-{
-  const int sweeps=20;
-  const double stride=1e-2;
-  double *push;
-  double sep,norm2,scale,move;
-  int pass,self,other,d;
-
-  check_alloc(push=(double*)malloc(sizeof(double)*DIM));
-
-  for (pass=0;pass<sweeps;pass++) {
-    for (self=0;self<CENTER;self++) {
-      /* Accumulate the per-coordinate contributions of all other centers. */
-      for (d=0;d<DIM;d++) {
-        push[d]=0.0;
-        for (other=0;other<CENTER;other++) {
-          if (other == self)
-            continue;
-          sep=center[self][d]-center[other][d];
-          push[d] += sep/sqr(sep)/fabs(sep);
-        }
-      }
-
-      norm2=0.0;
-      for (d=0;d<DIM;d++)
-        norm2 += sqr(push[d]);
-      scale=stride/sqrt(norm2);
-
-      /* Apply the step only where the coordinate stays in range. */
-      for (d=0;d<DIM;d++) {
-        move=scale*push[d];
-        if (((center[self][d]+move) > -0.1) && ((center[self][d]+move) < 1.1))
-          center[self][d] += move;
-      }
-    }
-  }
-
-  free(push);
-}
-
-/*
- * Set up and solve the linear system for the model coefficients.
- *
- * For every in-sample delay vector the basis functions are evaluated
- * once; their products are accumulated into the lower triangle of a
- * (CENTER+1)x(CENTER+1) matrix and their products with the value STEP
- * samples ahead into coefs. Index 0 stands for the constant term.
- * Both are divided by the number of samples, the matrix is mirrored
- * into its upper triangle and the system is passed to solvele().
- *
- * NOTE(review): solvele() is expected to leave the solution in coefs,
- * which is how the callers use it -- confirm against routines/tsa.h.
- */
-void make_fit(void)
-{
-  double **mat,*phi;
-  double target,w,count;
-  int row,col,t;
-
-  check_alloc(mat=(double**)malloc(sizeof(double*)*(CENTER+1)));
-  for (row=0;row<=CENTER;row++)
-    check_alloc(mat[row]=(double*)malloc(sizeof(double)*(CENTER+1)));
-  check_alloc(phi=(double*)malloc(sizeof(double)*CENTER));
-
-  for (row=0;row<=CENTER;row++) {
-    coefs[row]=0.0;
-    for (col=0;col<=CENTER;col++)
-      mat[row][col]=0.0;
-  }
-
-  for (t=(DIM-1)*DELAY;t<INSAMPLE-STEP;t++) {
-    target=series[t+STEP];
-    for (row=0;row<CENTER;row++)
-      phi[row]=rbf(&series[t],center[row]);
-
-    /* Row and column 0 belong to the constant term. */
-    coefs[0] += target;
-    mat[0][0] += 1.0;
-    for (row=1;row<=CENTER;row++) {
-      w=phi[row-1];
-      mat[row][0] += w;
-      coefs[row] += target*w;
-      for (col=1;col<=row;col++)
-        mat[row][col] += w*phi[col-1];
-    }
-  }
-
-  /* Turn the sums into averages and fill in the upper triangle. */
-  count=(double)(INSAMPLE-STEP-(DIM-1)*DELAY);
-  for (row=0;row<=CENTER;row++) {
-    coefs[row] /= count;
-    for (col=0;col<=row;col++) {
-      mat[row][col] /= count;
-      mat[col][row]=mat[row][col];
-    }
-  }
-
-  solvele(mat,coefs,(unsigned int)(CENTER+1));
-
-  for (row=0;row<=CENTER;row++)
-    free(mat[row]);
-  free(mat);
-  free(phi);
-}
-
-/*
- * Root mean squared STEP-ahead prediction error of the fitted model
- * over the part of the series delimited by i0 and i1.
- *
- * i0  index of the first sample of the range
- * i1  index one past the last sample of the range
- *
- * Predictions start at i0+(DIM-1)*DELAY and stop before i1-STEP; the
- * sum of squared residuals is divided by i1-i0-STEP-(DIM-1)*DELAY
- * before the square root is taken.
- */
-double forecast_error(unsigned long i0,unsigned long i1)
-{
-  double sq_sum=0.0;
-  double pred,resid;
-  int c,t;
-
-  for (t=i0+(DIM-1)*DELAY;t<i1-STEP;t++) {
-    pred=coefs[0];
-    for (c=0;c<CENTER;c++)
-      pred += coefs[c+1]*rbf(&series[t],center[c]);
-    resid=series[t+STEP]-pred;
-    sq_sum += resid*resid;
-  }
-
-  return sqrt(sq_sum/(i1-i0-STEP-(DIM-1)*DELAY));
-}
-
-/*
- * Iterate the fitted model CLENGTH times and print each predicted
- * value, mapped back with interval and min, on its own line.
- *
- * out  stream the forecast is written to
- *
- * A window of (DIM-1)*DELAY+1 values is seeded with the end of the
- * series; after every prediction it is shifted by one element and the
- * new value is appended, so predictions feed later predictions.
- */
-void make_cast(FILE *out)
-{
-  double *cast,new_el;
-  int i,dim;
-  long n;
-
-  dim=(DIM-1)*DELAY;
-  check_alloc(cast=(double*)malloc(sizeof(double)*(dim+1)));
-  for (i=0;i<=dim;i++)
-    cast[i]=series[LENGTH-1-dim+i];
-
-  /* The counter has the type of CLENGTH so large requests cannot overflow it. */
-  for (n=0;n<CLENGTH;n++) {
-    new_el=coefs[0];
-    for (i=1;i<=CENTER;i++)
-      new_el += coefs[i]*rbf(&cast[dim],center[i-1]);
-    fprintf(out,"%e\n",new_el*interval+min);
-    for (i=0;i<dim;i++)
-      cast[i]=cast[i+1];
-    cast[dim]=new_el;
-  }
-
-  /* The window was previously leaked. */
-  free(cast);
-}
-
-/*
- * Program entry point.
- *
- * Reads the options and the data, rescales the series, spreads the
- * centers over the delay vectors (optionally followed by drift()),
- * fits the coefficients and writes centers, width, coefficients and
- * the normalised in-sample error. When fewer than all points are used
- * for the fit the out-of-sample error is written as well, and with -L
- * a forecast follows. Everything goes to one stream: the output file
- * when -o was given, stdout otherwise.
- *
- * Returns 0 on success and EXIT_FAILURE when the output file cannot
- * be opened.
- */
-int main(int argc,char **argv)
-{
-  char stdi=0;
-  int i,j;
-  long cstep,offset;
-  unsigned long n;
-  double sigma,av;
-  FILE *file=NULL;
-  FILE *out=stdout;
-
-  if (scan_help(argc,argv))
-    show_options(argv[0]);
-
-  scan_options(argc,argv);
-#ifndef OMIT_WHAT_I_DO
-  if (verbosity&VER_INPUT)
-    what_i_do(argv[0],WID_STR);
-#endif
-
-  infile=search_datafile(argc,argv,&COLUMN,verbosity);
-  if (infile == NULL)
-    stdi=1;
-
-  /* Derive the default output name from the input name. */
-  if (outfile == NULL) {
-    if (!stdi) {
-      check_alloc(outfile=(char*)calloc(strlen(infile)+5,(size_t)1));
-      strcpy(outfile,infile);
-      strcat(outfile,".rbf");
-    }
-    else {
-      check_alloc(outfile=(char*)calloc((size_t)10,(size_t)1));
-      strcpy(outfile,"stdin.rbf");
-    }
-  }
-  if (!stdo)
-    test_outfile(outfile);
-
-  series=(double*)get_series(infile,&LENGTH,exclude,COLUMN,verbosity);
-  rescale_data(series,LENGTH,&min,&interval);
-  variance(series,LENGTH,&av,&varianz);
-
-  if (INSAMPLE > LENGTH)
-    INSAMPLE=LENGTH;
-
-  if (CENTER > LENGTH)
-    CENTER = LENGTH;
-
-  /* Iterated forecasts are always built from one-step predictions. */
-  if (MAKECAST)
-    STEP=1;
-
-  check_alloc(coefs=(double*)malloc(sizeof(double)*(CENTER+1)));
-  check_alloc(center=(double**)malloc(sizeof(double*)*CENTER));
-  for (i=0;i<CENTER;i++)
-    check_alloc(center[i]=(double*)malloc(sizeof(double)*DIM));
-
-  /*
-   * Take the centers from delay vectors spread evenly over the series.
-   * The product is formed in long so it cannot overflow int, and a
-   * single center is placed on the first delay vector instead of
-   * dividing by CENTER-1 == 0.
-   */
-  cstep=(long)LENGTH-1-(long)(DIM-1)*DELAY;
-  for (i=0;i<CENTER;i++) {
-    offset=(CENTER > 1) ? ((long)i*cstep)/(CENTER-1) : 0;
-    for (j=0;j<DIM;j++)
-      center[i][j]=series[(DIM-1)*DELAY-j*DELAY+offset];
-  }
-
-  if (setdrift)
-    drift();
-  varianz=avdistance();
-  make_fit();
-
-  /* Pick the output stream once; everything below writes to `out`. */
-  if (!stdo) {
-    file=fopen(outfile,"w");
-    if (file == NULL) {
-      fprintf(stderr,"Cannot open %s for writing\n",outfile);
-      return EXIT_FAILURE;
-    }
-    if (verbosity&VER_INPUT)
-      fprintf(stderr,"Opened %s for writing\n",outfile);
-    out=file;
-  }
-  else {
-    if (verbosity&VER_INPUT)
-      fprintf(stderr,"Writing to stdout\n");
-  }
-
-  fprintf(out,"#Center points used:\n");
-  for (i=0;i<CENTER;i++) {
-    fprintf(out,"#");
-    for (j=0;j<DIM;j++)
-      fprintf(out," %e",center[i][j]*interval+min);
-    fprintf(out,"\n");
-  }
-  fprintf(out,"#variance= %e\n",varianz*interval);
-  fprintf(out,"#Coefficients:\n");
-  fprintf(out,"#%e\n",coefs[0]*interval+min);
-  for (i=1;i<=CENTER;i++)
-    fprintf(out,"#%e\n",coefs[i]*interval);
-
-  /* The in-sample error is reported relative to the in-sample spread. */
-  av=sigma=0.0;
-  for (n=0;n<INSAMPLE;n++) {
-    av += series[n];
-    sigma += series[n]*series[n];
-  }
-  av /= INSAMPLE;
-  sigma=sqrt(fabs(sigma/INSAMPLE-av*av));
-  fprintf(out,"#insample error= %e\n",forecast_error(0LU,INSAMPLE)/sigma);
-
-  if (INSAMPLE < LENGTH) {
-    av=sigma=0.0;
-    for (n=INSAMPLE;n<LENGTH;n++) {
-      av += series[n];
-      sigma += series[n]*series[n];
-    }
-    av /= (LENGTH-INSAMPLE);
-    sigma=sqrt(fabs(sigma/(LENGTH-INSAMPLE)-av*av));
-    /* Used to test `!stdout`, which sent this line to stdout even with -o. */
-    fprintf(out,"#out of sample error= %e\n",
-            forecast_error(INSAMPLE,LENGTH)/sigma);
-  }
-
-  if (MAKECAST)
-    make_cast(out);
-
-  if (!stdo)
-    fclose(file);
-
-  return 0;
-}