src/tools/gmx_analyze.c

   1 /*  -*- mode: c; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4; c-file-style: "stroustrup"; -*-
   2  *
   3  *
   4  *                This source code is part of
   5  *
   6  *                 G   R   O   M   A   C   S
   7  *
   8  *          GROningen MAchine for Chemical Simulations
   9  *
  10  *                        VERSION 3.2.0
  11  * Written by David van der Spoel, Erik Lindahl, Berk Hess, and others.
  12  * Copyright (c) 1991-2000, University of Groningen, The Netherlands.
  13  * Copyright (c) 2001-2004, The GROMACS development team,
  14  * check out http://www.gromacs.org for more information.
  15
  16  * This program is free software; you can redistribute it and/or
  17  * modify it under the terms of the GNU General Public License
  18  * as published by the Free Software Foundation; either version 2
  19  * of the License, or (at your option) any later version.
  20  *
  21  * If you want to redistribute modifications, please consider that
  22  * scientific software is very special. Version control is crucial -
  23  * bugs must be traceable. We will be happy to consider code for
  24  * inclusion in the official distribution, but derived work must not
  25  * be called official GROMACS. Details are found in the README & COPYING
  26  * files - if they are missing, get the official version at www.gromacs.org.
  27  *
  28  * To help us fund GROMACS development, we humbly ask that you cite
  29  * the papers on the package - you can find them in the top README file.
  30  *
  31  * For more info, check our website at http://www.gromacs.org
  32  *
  33  * And Hey:
  34  * Green Red Orange Magenta Azure Cyan Skyblue
  35  */
  36 #ifdef HAVE_CONFIG_H
  37 #include <config.h>
  38 #endif
  39 #include <math.h>
  40 #include <string.h>
  41 #include "statutil.h"
  42 #include "sysstuff.h"
  43 #include "typedefs.h"
  44 #include "smalloc.h"
  45 #include "macros.h"
  46 #include "gmx_fatal.h"
  47 #include "vec.h"
  48 #include "copyrite.h"
  49 #include "futil.h"
  50 #include "readinp.h"
  51 #include "statutil.h"
  52 #include "txtdump.h"
  53 #include "gstat.h"
  54 #include "gmx_matrix.h"
  55 #include "gmx_statistics.h"
  56 #include "xvgr.h"
  57 #include "gmx_ana.h"
  58 #include "geminate.h"
  59
  60 /* must correspond to char *avbar_opt[] declared in main() */
  61 enum { avbarSEL, avbarNONE, avbarSTDDEV, avbarERROR, avbar90, avbarNR };
  62
  63 static void power_fit(int n,int nset,real **val,real *t)
  64 {
  65   real *x,*y,quality,a,b,r;
  66   int  s,i;
  67
  68   snew(x,n);
  69   snew(y,n);
  70
  71   if (t[0]>0) {
  72     for(i=0; i<n; i++)
  73       if (t[0]>0)
  74         x[i] = log(t[i]);
  75   } else {
  76     fprintf(stdout,"First time is not larger than 0, using index number as time for power fit\n");
  77     for(i=0; i<n; i++)
  78       x[i] = log(i+1);
  79   }
  80
  81   for(s=0; s<nset; s++) {
  82     i=0;
  83     for(i=0; i<n && val[s][i]>=0; i++)
  84       y[i] = log(val[s][i]);
  85     if (i < n)
  86       fprintf(stdout,"Will power fit up to point %d, since it is not larger than 0\n",i);
  87     lsq_y_ax_b(i,x,y,&a,&b,&r,&quality);
  88     fprintf(stdout,"Power fit set %3d:  error %.3f  a %g  b %g\n",
  89             s+1,quality,a,exp(b));
  90   }
  91
  92   sfree(y);
  93   sfree(x);
  94 }
  95
  96 static real cosine_content(int nhp,int n,real *y)
  97      /* Assumes n equidistant points */
  98 {
  99   double fac,cosyint,yyint;
 100   int i;
 101
 102   if (n < 2)
 103     return 0;
 104
 105   fac = M_PI*nhp/(n-1);
 106
 107   cosyint = 0;
 108   yyint = 0;
 109   for(i=0; i<n; i++) {
 110     cosyint += cos(fac*i)*y[i];
 111     yyint += y[i]*y[i];
 112   }
 113
 114   return 2*cosyint*cosyint/(n*yyint);
 115 }
 116
 117 static void plot_coscont(const char *ccfile,int n,int nset,real **val,
 118                          const output_env_t oenv)
 119 {
 120   FILE *fp;
 121   int  s;
 122   real cc;
 123
 124   fp = xvgropen(ccfile,"Cosine content","set / half periods","cosine content",
 125                 oenv);
 126
 127   for(s=0; s<nset; s++) {
 128     cc = cosine_content(s+1,n,val[s]);
 129     fprintf(fp," %d %g\n",s+1,cc);
 130     fprintf(stdout,"Cosine content of set %d with %.1f periods: %g\n",
 131             s+1,0.5*(s+1),cc);
 132   }
 133   fprintf(stdout,"\n");
 134
 135   ffclose(fp);
 136 }
 137
 138 static void regression_analysis(int n,bool bXYdy,
 139                                 real *x,int nset,real **val)
 140 {
 141   real S,chi2,a,b,da,db,r=0;
 142
 143   if (bXYdy || (nset == 1))
 144   {
 145       printf("Fitting data to a function f(x) = ax + b\n");
 146       printf("Minimizing residual chi2 = Sum_i w_i [f(x_i) - y_i]2\n");
 147       printf("Error estimates will be given if w_i (sigma) values are given\n");
 148       printf("(use option -xydy).\n\n");
 149       if (bXYdy)
 150           lsq_y_ax_b_error(n,x,val[0],val[1],&a,&b,&da,&db,&r,&S);
 151       else
 152           lsq_y_ax_b(n,x,val[0],&a,&b,&r,&S);
 153       chi2 = sqr((n-2)*S);
 154       printf("Chi2                    = %g\n",chi2);
 155       printf("S (Sqrt(Chi2/(n-2))     = %g\n",S);
 156       printf("Correlation coefficient = %.1f%%\n",100*r);
 157       printf("\n");
 158       if (bXYdy) {
 159           printf("a    = %g +/- %g\n",a,da);
 160           printf("b    = %g +/- %g\n",b,db);
 161       }
 162       else {
 163           printf("a    = %g\n",a);
 164           printf("b    = %g\n",b);
 165       }
 166   }
 167   else
 168   {
 169       double chi2,*a,**xx,*y;
 170       int i,j;
 171
 172       snew(y,n);
 173       snew(xx,nset-1);
 174       for(j=0; (j<nset-1); j++)
 175           snew(xx[j],n);
 176       for(i=0; (i<n); i++)
 177       {
 178           y[i] = val[0][i];
 179           for(j=1; (j<nset); j++)
 180               xx[j-1][i] = val[j][i];
 181       }
 182       snew(a,nset-1);
 183       chi2 = multi_regression(NULL,n,y,nset-1,xx,a);
 184       printf("Fitting %d data points in %d sets\n",n,nset-1);
 185       printf("chi2 = %g\n",chi2);
 186       printf("A =");
 187       for(i=0; (i<nset-1); i++)
 188       {
 189           printf("  %g",a[i]);
 190           sfree(xx[i]);
 191       }
 192       printf("\n");
 193       sfree(xx);
 194       sfree(y);
 195       sfree(a);
 196   }
 197 }
 198
 199 void histogram(const char *distfile,real binwidth,int n, int nset, real **val,
 200                const output_env_t oenv)
 201 {
 202   FILE *fp;
 203   int  i,s;
 204   double min,max;
 205   int  nbin;
 206 #if (defined SIZEOF_LONG_LONG_INT) && (SIZEOF_LONG_LONG_INT >= 8)
 207   long long int *histo;
 208 #else
 209   double        *histo;
 210 #endif
 211
 212   min = val[0][0];
 213   max = val[0][0];
 214   for(s=0; s<nset; s++)
 215     for(i=0; i<n; i++)
 216       if (val[s][i] < min)
 217         min = val[s][i];
 218       else if (val[s][i] > max)
 219         max = val[s][i];
 220
 221   min = binwidth*floor(min/binwidth);
 222   max = binwidth*ceil(max/binwidth);
 223   if (min != 0)
 224     min -= binwidth;
 225   max += binwidth;
 226
 227   nbin = (int)((max - min)/binwidth + 0.5) + 1;
 228   fprintf(stderr,"Making distributions with %d bins\n",nbin);
 229   snew(histo,nbin);
 230   fp = xvgropen(distfile,"Distribution","","",oenv);
 231   for(s=0; s<nset; s++) {
 232     for(i=0; i<nbin; i++)
 233       histo[i] = 0;
 234     for(i=0; i<n; i++)
 235       histo[(int)((val[s][i] - min)/binwidth + 0.5)]++;
 236     for(i=0; i<nbin; i++)
 237       fprintf(fp," %g  %g\n",min+i*binwidth,(double)histo[i]/(n*binwidth));
 238     if (s < nset-1)
 239       fprintf(fp,"&\n");
 240   }
 241   ffclose(fp);
 242 }
 243
 244 static int real_comp(const void *a,const void *b)
 245 {
 246   real dif = *(real *)a - *(real *)b;
 247
 248   if (dif < 0)
 249     return -1;
 250   else if (dif > 0)
 251     return 1;
 252   else
 253     return 0;
 254 }
 255
 256 static void average(const char *avfile,int avbar_opt,
 257                     int n, int nset,real **val,real *t)
 258 {
 259   FILE   *fp;
 260   int    i,s,edge=0;
 261   double av,var,err;
 262   real   *tmp=NULL;
 263
 264   fp = ffopen(avfile,"w");
 265   if ((avbar_opt == avbarERROR) && (nset == 1))
 266     avbar_opt = avbarNONE;
 267   if (avbar_opt != avbarNONE) {
 268     if (avbar_opt == avbar90) {
 269       snew(tmp,nset);
 270       fprintf(fp,"@TYPE xydydy\n");
 271       edge = (int)(nset*0.05+0.5);
 272       fprintf(stdout,"Errorbars: discarding %d points on both sides: %d%%"
 273               " interval\n",edge,(int)(100*(nset-2*edge)/nset+0.5));
 274     } else
 275       fprintf(fp,"@TYPE xydy\n");
 276   }
 277
 278   for(i=0; i<n; i++) {
 279     av = 0;
 280     for(s=0; s<nset; s++)
 281       av += val[s][i];
 282     av /= nset;
 283     fprintf(fp," %g %g",t[i],av);
 284     var = 0;
 285     if (avbar_opt != avbarNONE) {
 286       if (avbar_opt == avbar90) {
 287         for(s=0; s<nset; s++)
 288           tmp[s] = val[s][i];
 289         qsort(tmp,nset,sizeof(tmp[0]),real_comp);
 290         fprintf(fp," %g %g",tmp[nset-1-edge]-av,av-tmp[edge]);
 291       } else {
 292         for(s=0; s<nset; s++)
 293           var += sqr(val[s][i]-av);
 294         if (avbar_opt == avbarSTDDEV)
 295           err = sqrt(var/nset);
 296         else
 297           err = sqrt(var/(nset*(nset-1)));
 298         fprintf(fp," %g",err);
 299       }
 300     }
 301     fprintf(fp,"\n");
 302   }
 303   ffclose(fp);
 304
 305   if (avbar_opt == avbar90)
 306     sfree(tmp);
 307 }
 308
 309 static real anal_ee_inf(real *parm,real T)
 310 {
 311   return sqrt(parm[1]*2*parm[0]/T+parm[3]*2*parm[2]/T);
 312 }
 313
 314 static real anal_ee(real *parm,real T,real t)
 315 {
 316   real e1,e2;
 317
 318   if (parm[0])
 319     e1 = exp(-t/parm[0]);
 320   else
 321     e1 = 1;
 322   if (parm[2])
 323     e2 = exp(-t/parm[2]);
 324   else
 325     e2 = 1;
 326
 327   return sqrt(parm[1]*2*parm[0]/T*((e1 - 1)*parm[0]/t + 1) +
 328               parm[3]*2*parm[2]/T*((e2 - 1)*parm[2]/t + 1));
 329 }
 330
 331 static void estimate_error(const char *eefile,int nb_min,int resol,int n,
 332                            int nset, double *av,double *sig,real **val,real dt,
 333                            bool bFitAc,bool bSingleExpFit,bool bAllowNegLTCorr,
 334                            const output_env_t oenv)
 335 {
 336     FILE   *fp;
 337     int    bs,prev_bs,nbs,nb;
 338     real   spacing,nbr;
 339     int    s,i,j;
 340     double blav,var;
 341     char   **leg;
 342     real   *tbs,*ybs,rtmp,dens,*fitsig,twooe,tau1_est,tau_sig;
 343     real   fitparm[4];
 344     real   ee,a,tau1,tau2;
 345
 346     if (n < 4)
 347     {
 348       fprintf(stdout,"The number of points is smaller than 4, can not make an error estimate\n");
 349
 350       return;
 351     }
 352
 353     fp = xvgropen(eefile,"Error estimates",
 354                   "Block size (time)","Error estimate", oenv);
 355     if (output_env_get_print_xvgr_codes(oenv))
 356     {
 357         fprintf(fp,
 358                 "@ subtitle \"using block averaging, total time %g (%d points)\"\n",
 359                 (n-1)*dt,n);
 360     }
 361     snew(leg,2*nset);
 362     xvgr_legend(fp,2*nset,leg,oenv);
 363     sfree(leg);
 364
 365     spacing = pow(2,1.0/resol);
 366     snew(tbs,n);
 367     snew(ybs,n);
 368     snew(fitsig,n);
 369     for(s=0; s<nset; s++)
 370     {
 371         nbs = 0;
 372         prev_bs = 0;
 373         nbr = nb_min;
 374         while (nbr <= n)
 375         {
 376             bs = n/(int)nbr;
 377             if (bs != prev_bs)
 378             {
 379                 nb = n/bs;
 380                 var = 0;
 381                 for(i=0; i<nb; i++)
 382                 {
 383                     blav=0;
 384                     for (j=0; j<bs; j++)
 385                     {
 386                         blav += val[s][bs*i+j];
 387                     }
 388                     var += sqr(av[s] - blav/bs);
 389                 }
 390                 tbs[nbs] = bs*dt;
 391                 if (sig[s] == 0)
 392                 {
 393                     ybs[nbs] = 0;
 394                 }
 395                 else
 396                 {
 397                     ybs[nbs] = var/(nb*(nb-1.0))*(n*dt)/(sig[s]*sig[s]);
 398                 }
 399                 nbs++;
 400             }
 401             nbr *= spacing;
 402             nb = (int)(nbr+0.5);
 403             prev_bs = bs;
 404         }
 405         if (sig[s] == 0)
 406         {
 407             ee   = 0;
 408             a    = 1;
 409             tau1 = 0;
 410             tau2 = 0;
 411         }
 412         else
 413         {
 414             for(i=0; i<nbs/2; i++)
 415             {
 416                 rtmp         = tbs[i];
 417                 tbs[i]       = tbs[nbs-1-i];
 418                 tbs[nbs-1-i] = rtmp;
 419                 rtmp         = ybs[i];
 420                 ybs[i]       = ybs[nbs-1-i];
 421                 ybs[nbs-1-i] = rtmp;
 422             }
 423             /* The initial slope of the normalized ybs^2 is 1.
 424              * For a single exponential autocorrelation: ybs(tau1) = 2/e tau1
 425              * From this we take our initial guess for tau1.
 426              */
 427             twooe = 2/exp(1);
 428             i = -1;
 429             do
 430             {
 431                 i++;
 432                 tau1_est = tbs[i];
 433             } while (i < nbs - 1 &&
 434                      (ybs[i] > ybs[i+1] || ybs[i] > twooe*tau1_est));
 435
 436             if (ybs[0] > ybs[1])
 437             {
 438                 fprintf(stdout,"Data set %d has strange time correlations:\n"
 439                         "the std. error using single points is larger than that of blocks of 2 points\n"
 440                         "The error estimate might be inaccurate, check the fit\n",
 441                         s+1);
 442                 /* Use the total time as tau for the fitting weights */
 443                 tau_sig = (n - 1)*dt;
 444             }
 445             else
 446             {
 447                 tau_sig = tau1_est;
 448             }
 449
 450             if (debug)
 451             {
 452                 fprintf(debug,"set %d tau1 estimate %f\n",s+1,tau1_est);
 453             }
 454
 455             /* Generate more or less appropriate sigma's,
 456              * also taking the density of points into account.
 457              */
 458             for(i=0; i<nbs; i++)
 459             {
 460                 if (i == 0)
 461                 {
 462                     dens = tbs[1]/tbs[0] - 1;
 463                 }
 464                 else if (i == nbs-1)
 465                 {
 466                     dens = tbs[nbs-1]/tbs[nbs-2] - 1;
 467                 }
 468                 else
 469                 {
 470                     dens = 0.5*(tbs[i+1]/tbs[i-1] - 1);
 471                 }
 472                 fitsig[i] = sqrt((tau_sig + tbs[i])/dens);
 473             }
 474
 475             if (!bSingleExpFit)
 476             {
 477                 fitparm[0] = tau1_est;
 478                 fitparm[1] = 0.95;
 479                 /* We set the initial guess for tau2
 480                  * to halfway between tau1_est and the total time (on log scale).
 481                  */
 482                 fitparm[2] = sqrt(tau1_est*(n-1)*dt);
 483                 do_lmfit(nbs,ybs,fitsig,0,tbs,0,dt*n,oenv,
 484                          bDebugMode(),effnERREST,fitparm,0);
 485                 fitparm[3] = 1-fitparm[1];
 486             }
 487             if (bSingleExpFit || fitparm[0]<0 || fitparm[2]<0 || fitparm[1]<0
 488                 || (fitparm[1]>1 && !bAllowNegLTCorr) || fitparm[2]>(n-1)*dt)
 489             {
 490                 if (!bSingleExpFit)
 491                 {
 492                     if (fitparm[2] > (n-1)*dt)
 493                     {
 494                         fprintf(stdout,
 495                                 "Warning: tau2 is longer than the length of the data (%g)\n"
 496                                 "         the statistics might be bad\n",
 497                                 (n-1)*dt);
 498                     }
 499                     else
 500                     {
 501                         fprintf(stdout,"a fitted parameter is negative\n");
 502                     }
 503                     fprintf(stdout,"invalid fit:  e.e. %g  a %g  tau1 %g  tau2 %g\n",
 504                             sig[s]*anal_ee_inf(fitparm,n*dt),
 505                             fitparm[1],fitparm[0],fitparm[2]);
 506                     /* Do a fit with tau2 fixed at the total time.
 507                      * One could also choose any other large value for tau2.
 508                      */
 509                     fitparm[0] = tau1_est;
 510                     fitparm[1] = 0.95;
 511                     fitparm[2] = (n-1)*dt;
 512                     fprintf(stderr,"Will fix tau2 at the total time: %g\n",fitparm[2]);
 513                     do_lmfit(nbs,ybs,fitsig,0,tbs,0,dt*n,oenv,bDebugMode(),
 514                              effnERREST,fitparm,4);
 515                     fitparm[3] = 1-fitparm[1];
 516                 }
 517                 if (bSingleExpFit || fitparm[0]<0 || fitparm[1]<0
 518                     || (fitparm[1]>1 && !bAllowNegLTCorr))
 519                 {
 520                     if (!bSingleExpFit) {
 521                         fprintf(stdout,"a fitted parameter is negative\n");
 522                         fprintf(stdout,"invalid fit:  e.e. %g  a %g  tau1 %g  tau2 %g\n",
 523                                 sig[s]*anal_ee_inf(fitparm,n*dt),
 524                                 fitparm[1],fitparm[0],fitparm[2]);
 525                     }
 526                     /* Do a single exponential fit */
 527                     fprintf(stderr,"Will use a single exponential fit for set %d\n",s+1);
 528                     fitparm[0] = tau1_est;
 529                     fitparm[1] = 1.0;
 530                     fitparm[2] = 0.0;
 531                     do_lmfit(nbs,ybs,fitsig,0,tbs,0,dt*n,oenv,bDebugMode(),
 532                              effnERREST,fitparm,6);
 533                     fitparm[3] = 1-fitparm[1];
 534                 }
 535             }
 536             ee   = sig[s]*anal_ee_inf(fitparm,n*dt);
 537             a    = fitparm[1];
 538             tau1 = fitparm[0];
 539             tau2 = fitparm[2];
 540         }
 541         fprintf(stdout,"Set %3d:  err.est. %g  a %g  tau1 %g  tau2 %g\n",
 542                 s+1,ee,a,tau1,tau2);
 543         fprintf(fp,"@ legend string %d \"av %f\"\n",2*s,av[s]);
 544         fprintf(fp,"@ legend string %d \"ee %6g\"\n",
 545                 2*s+1,sig[s]*anal_ee_inf(fitparm,n*dt));
 546         for(i=0; i<nbs; i++)
 547         {
 548             fprintf(fp,"%g %g %g\n",tbs[i],sig[s]*sqrt(ybs[i]/(n*dt)),
 549                     sig[s]*sqrt(fit_function(effnERREST,fitparm,tbs[i])/(n*dt)));
 550         }
 551
 552         if (bFitAc)
 553         {
 554             int fitlen;
 555             real *ac,acint,ac_fit[4];
 556
 557             snew(ac,n);
 558             for(i=0; i<n; i++) {
 559                 ac[i] = val[s][i] - av[s];
 560                 if (i > 0)
 561                     fitsig[i] = sqrt(i);
 562                 else
 563                     fitsig[i] = 1;
 564             }
 565             low_do_autocorr(NULL,oenv,NULL,n,1,-1,&ac,
 566                             dt,eacNormal,1,FALSE,TRUE,
 567                             FALSE,0,0,effnNONE,0);
 568
 569             fitlen = n/nb_min;
 570
 571             /* Integrate ACF only up to fitlen/2 to avoid integrating noise */
 572             acint = 0.5*ac[0];
 573             for(i=1; i<=fitlen/2; i++)
 574             {
 575                 acint += ac[i];
 576             }
 577             acint *= dt;
 578
 579             /* Generate more or less appropriate sigma's */
 580             for(i=0; i<=fitlen; i++)
 581             {
 582                 fitsig[i] = sqrt(acint + dt*i);
 583             }
 584
 585             ac_fit[0] = 0.5*acint;
 586             ac_fit[1] = 0.95;
 587             ac_fit[2] = 10*acint;
 588             do_lmfit(n/nb_min,ac,fitsig,dt,0,0,fitlen*dt,oenv,
 589                      bDebugMode(),effnEXP3,ac_fit,0);
 590             ac_fit[3] = 1 - ac_fit[1];
 591
 592             fprintf(stdout,"Set %3d:  ac erest %g  a %g  tau1 %g  tau2 %g\n",
 593                     s+1,sig[s]*anal_ee_inf(ac_fit,n*dt),
 594                     ac_fit[1],ac_fit[0],ac_fit[2]);
 595
 596             fprintf(fp,"&\n");
 597             for(i=0; i<nbs; i++)
 598             {
 599                 fprintf(fp,"%g %g\n",tbs[i],
 600                         sig[s]*sqrt(fit_function(effnERREST,ac_fit,tbs[i]))/(n*dt));
 601             }
 602
 603             sfree(ac);
 604         }
 605         if (s < nset-1)
 606         {
 607             fprintf(fp,"&\n");
 608         }
 609     }
 610     sfree(fitsig);
 611     sfree(ybs);
 612     sfree(tbs);
 613     ffclose(fp);
 614 }
 615
 616 static void luzar_correl(int nn,real *time,int nset,real **val,real temp,
 617                          bool bError,real fit_start,real smooth_tail_start,
 618                          const output_env_t oenv)
 619 {
 620   const real tol = 1e-8;
 621   real *kt;
 622   real weight,d2;
 623   int  j;
 624
 625   please_cite(stdout,"Spoel2006b");
 626
 627   /* Compute negative derivative k(t) = -dc(t)/dt */
 628   if (!bError) {
 629     snew(kt,nn);
 630     compute_derivative(nn,time,val[0],kt);
 631     for(j=0; (j<nn); j++)
 632       kt[j] = -kt[j];
 633     if (debug) {
 634       d2 = 0;
 635       for(j=0; (j<nn); j++)
 636         d2 += sqr(kt[j] - val[3][j]);
 637       fprintf(debug,"RMS difference in derivatives is %g\n",sqrt(d2/nn));
 638     }
 639     analyse_corr(nn,time,val[0],val[2],kt,NULL,NULL,NULL,fit_start,
 640                  temp,smooth_tail_start,oenv);
 641     sfree(kt);
 642   }
 643   else if (nset == 6) {
 644     analyse_corr(nn,time,val[0],val[2],val[4],
 645                  val[1],val[3],val[5],fit_start,temp,smooth_tail_start,oenv);
 646   }
 647   else {
 648     printf("Inconsistent input. I need c(t) sigma_c(t) n(t) sigma_n(t) K(t) sigma_K(t)\n");
 649     printf("Not doing anything. Sorry.\n");
 650   }
 651 }
 652
 653 static void filter(real flen,int n,int nset,real **val,real dt,
 654                    const output_env_t oenv)
 655 {
 656   int    f,s,i,j;
 657   double *filt,sum,vf,fluc,fluctot;
 658
 659   f = (int)(flen/(2*dt));
 660   snew(filt,f+1);
 661   filt[0] = 1;
 662   sum = 1;
 663   for(i=1; i<=f; i++) {
 664     filt[i] = cos(M_PI*dt*i/flen);
 665     sum += 2*filt[i];
 666   }
 667   for(i=0; i<=f; i++)
 668     filt[i] /= sum;
 669   fprintf(stdout,"Will calculate the fluctuation over %d points\n",n-2*f);
 670   fprintf(stdout,"  using a filter of length %g of %d points\n",flen,2*f+1);
 671   fluctot = 0;
 672   for(s=0; s<nset; s++) {
 673     fluc = 0;
 674     for(i=f; i<n-f; i++) {
 675       vf = filt[0]*val[s][i];
 676       for(j=1; j<=f; j++)
 677         vf += filt[j]*(val[s][i-f]+val[s][i+f]);
 678       fluc += sqr(val[s][i] - vf);
 679     }
 680     fluc /= n - 2*f;
 681     fluctot += fluc;
 682     fprintf(stdout,"Set %3d filtered fluctuation: %12.6e\n",s+1,sqrt(fluc));
 683   }
 684   fprintf(stdout,"Overall filtered fluctuation: %12.6e\n",sqrt(fluctot/nset));
 685   fprintf(stdout,"\n");
 686
 687   sfree(filt);
 688 }
 689
 690 static void do_fit(FILE *out,int n,bool bYdy,int ny,real *x0,real **val,
 691                    int npargs,t_pargs *ppa,const output_env_t oenv)
 692 {
 693   real *c1=NULL,*sig=NULL,*fitparm;
 694   real dt=0,tendfit,tbeginfit;
 695   int  i,efitfn,nparm;
 696
 697   efitfn = get_acffitfn();
 698   nparm  = nfp_ffn[efitfn];
 699   fprintf(out,"Will fit to the following function:\n");
 700   fprintf(out,"%s\n",longs_ffn[efitfn]);
 701   c1 = val[n];
 702   if (bYdy) {
 703     c1  = val[n];
 704     sig = val[n+1];
 705     fprintf(out,"Using two columns as y and sigma values\n");
 706   } else {
 707     snew(sig,ny);
 708   }
 709   if (opt2parg_bSet("-beginfit",npargs,ppa)) {
 710     tbeginfit = opt2parg_real("-beginfit",npargs,ppa);
 711   } else {
 712     tbeginfit = x0 ? x0[0]    : 0;
 713   }
 714   if (opt2parg_bSet("-endfit",npargs,ppa)) {
 715     tendfit   = opt2parg_real("-endfit",npargs,ppa);
 716   } else {
 717     tendfit   = x0 ? x0[ny-1] : (ny-1)*dt;
 718   }
 719
 720   snew(fitparm,nparm);
 721   switch(efitfn) {
 722   case effnEXP1:
 723     fitparm[0] = 0.5;
 724     break;
 725   case effnEXP2:
 726     fitparm[0] = 0.5;
 727     fitparm[1] = c1[0];
 728     break;
 729   case effnEXP3:
 730     fitparm[0] = 1.0;
 731     fitparm[1] = 0.5*c1[0];
 732     fitparm[2] = 10.0;
 733     break;
 734   case effnEXP5:
 735     fitparm[0] = fitparm[2] = 0.5*c1[0];
 736     fitparm[1] = 10;
 737     fitparm[3] = 40;
 738     fitparm[4] = 0;
 739     break;
 740   case effnEXP7:
 741     fitparm[0] = fitparm[2] = fitparm[4] = 0.33*c1[0];
 742     fitparm[1] = 1;
 743     fitparm[3] = 10;
 744     fitparm[5] = 100;
 745     fitparm[6] = 0;
 746     break;
 747   case effnEXP9:
 748     fitparm[0] = fitparm[2] = fitparm[4] = fitparm[6] = 0.25*c1[0];
 749     fitparm[1] = 0.1;
 750     fitparm[3] = 1;
 751     fitparm[5] = 10;
 752     fitparm[7] = 100;
 753     fitparm[8] = 0;
 754     break;
 755   default:
 756     fprintf(out,"Warning: don't know how to initialize the parameters\n");
 757     for(i=0; (i<nparm); i++)
 758       fitparm[i] = 1;
 759   }
 760   fprintf(out,"Starting parameters:\n");
 761   for(i=0; (i<nparm); i++)
 762     fprintf(out,"a%-2d = %12.5e\n",i+1,fitparm[i]);
 763   if (do_lmfit(ny,c1,sig,dt,x0,tbeginfit,tendfit,
 764                oenv,bDebugMode(),efitfn,fitparm,0)) {
 765     for(i=0; (i<nparm); i++)
 766       fprintf(out,"a%-2d = %12.5e\n",i+1,fitparm[i]);
 767   }
 768   else {
 769     fprintf(out,"No solution was found\n");
 770   }
 771 }
 772
 773 static void do_ballistic(const char *balFile, int nData,
 774                          real *t, real **val, int nSet,
 775                          real balTime, int nBalExp,
 776                          bool bDerivative,
 777                          const output_env_t oenv)
 778 {
 779   double **ctd=NULL, *td=NULL;
 780   t_gemParams *GP = init_gemParams(0, 0, t, 0, nData, balTime, nBalExp, bDerivative);
 781   static char *leg[] = {"Ac'(t)"};
 782   FILE *fp;
 783   int i, set;
 784
 785   if (GP->ballistic/GP->tDelta >= GP->nExpFit*2+1)
 786   {
 787       snew(ctd, nSet);
 788       snew(td,  nData);
 789
 790       fp = xvgropen(balFile, "Hydrogen Bond Autocorrelation","Time (ps)","C'(t)", oenv);
 791       xvgr_legend(fp,asize(leg),leg,oenv);
 792
 793       for (set=0; set<nSet; set++)
 794       {
 795           snew(ctd[set], nData);
 796           for (i=0; i<nData; i++) {
 797               ctd[set][i] = (double)val[set][i];
 798               if (set==0)
 799                   td[i] = (double)t[i];
 800           }
 801
 802           takeAwayBallistic(ctd[set], td, nData, GP->ballistic, GP->nExpFit, GP->bDt);
 803       }
 804
 805       for (i=0; i<nData; i++)
 806       {
 807           fprintf(fp, "  %g",t[i]);
 808           for (set=0; set<nSet; set++)
 809           {
 810               fprintf(fp, "  %g", ctd[set][i]);
 811           }
 812           fprintf(fp, "\n");
 813       }
 814
 815
 816       for (set=0; set<nSet; set++)
 817           sfree(ctd[set]);
 818       sfree(ctd);
 819       sfree(td);
 820   }
 821   else
 822       printf("Number of data points is less than the number of parameters to fit\n."
 823              "The system is underdetermined, hence no ballistic term can be found.\n\n");
 824 }
 825
 826 static void do_geminate(const char *gemFile, int nData,
 827                         real *t, real **val, int nSet,
 828                         const real D, const real logAfterTime,
 829                         real rcut, real balTime,
 830                         const output_env_t oenv)
 831 {
 832     double **ctd=NULL, **ctdGem=NULL, *td=NULL;
 833     t_gemParams *GP = init_gemParams(rcut, D, t, logAfterTime,
 834                                      nData, balTime, 1, FALSE);
 835     static char *leg[] = {"Ac\\sgem\\N(t)"};
 836     FILE *fp;
 837     int i, set;
 838
 839     snew(ctd,    nSet);
 840     snew(ctdGem, nSet);
 841     snew(td,  nData);
 842
 843     fp = xvgropen(gemFile, "Hydrogen Bond Autocorrelation","Time (ps)","C'(t)", oenv);
 844     xvgr_legend(fp,asize(leg),leg,oenv);
 845
 846     for (set=0; set<nSet; set++)
 847     {
 848         snew(ctd[set],    nData);
 849         snew(ctdGem[set], nData);
 850         for (i=0; i<nData; i++) {
 851             ctd[set][i] = (double)val[set][i];
 852             if (set==0)
 853                 td[i] = (double)t[i];
 854         }
 855         fitGemRecomb(ctd[set], td, &(ctd[set]), nData, GP);
 856     }
 857
 858     for (i=0; i<nData; i++)
 859         {
 860         fprintf(fp, "  %g",t[i]);
 861         for (set=0; set<nSet; set++)
 862             {
 863             fprintf(fp, "  %g", ctdGem[set][i]);
 864             }
 865         fprintf(fp, "\n");
 866         }
 867
 868     for (set=0; set<nSet; set++)
 869     {
 870         sfree(ctd[set]);
 871         sfree(ctdGem[set]);
 872     }
 873     sfree(ctd);
 874     sfree(ctdGem);
 875     sfree(td);
 876 }
 877
 878 int gmx_analyze(int argc,char *argv[])
 879 {
 880   static const char *desc[] = {
 881     "g_analyze reads an ascii file and analyzes data sets.",
 882     "A line in the input file may start with a time",
 883     "(see option [TT]-time[tt]) and any number of y values may follow.",
 884     "Multiple sets can also be",
 885     "read when they are seperated by & (option [TT]-n[tt]),",
 886     "in this case only one y value is read from each line.",
 887     "All lines starting with # and @ are skipped.",
 888     "All analyses can also be done for the derivative of a set",
 889     "(option [TT]-d[tt]).[PAR]",
 890
 891     "All options, except for [TT]-av[tt] and [TT]-power[tt] assume that the",
 892     "points are equidistant in time.[PAR]",
 893
 894     "g_analyze always shows the average and standard deviation of each",
 895     "set. For each set it also shows the relative deviation of the third",
 896     "and forth cumulant from those of a Gaussian distribution with the same",
 897     "standard deviation.[PAR]",
 898
 899     "Option [TT]-ac[tt] produces the autocorrelation function(s).[PAR]",
 900
 901     "Option [TT]-cc[tt] plots the resemblance of set i with a cosine of",
 902     "i/2 periods. The formula is:[BR]"
 903     "2 (int0-T y(t) cos(i pi t) dt)^2 / int0-T y(t) y(t) dt[BR]",
 904     "This is useful for principal components obtained from covariance",
 905     "analysis, since the principal components of random diffusion are",
 906     "pure cosines.[PAR]",
 907
 908     "Option [TT]-msd[tt] produces the mean square displacement(s).[PAR]",
 909
 910     "Option [TT]-dist[tt] produces distribution plot(s).[PAR]",
 911
 912     "Option [TT]-av[tt] produces the average over the sets.",
 913     "Error bars can be added with the option [TT]-errbar[tt].",
 914     "The errorbars can represent the standard deviation, the error",
 915     "(assuming the points are independent) or the interval containing",
 916     "90% of the points, by discarding 5% of the points at the top and",
 917     "the bottom.[PAR]",
 918
 919     "Option [TT]-ee[tt] produces error estimates using block averaging.",
 920     "A set is divided in a number of blocks and averages are calculated for",
 921     "each block. The error for the total average is calculated from",
 922     "the variance between averages of the m blocks B_i as follows:",
 923     "error^2 = Sum (B_i - <B>)^2 / (m*(m-1)).",
 924     "These errors are plotted as a function of the block size.",
 925     "Also an analytical block average curve is plotted, assuming",
 926     "that the autocorrelation is a sum of two exponentials.",
 927     "The analytical curve for the block average is:[BR]",
 928     "f(t) = sigma sqrt(2/T (  a   (tau1 ((exp(-t/tau1) - 1) tau1/t + 1)) +[BR]",
 929     "                       (1-a) (tau2 ((exp(-t/tau2) - 1) tau2/t + 1)))),[BR]"
 930     "where T is the total time.",
 931     "a, tau1 and tau2 are obtained by fitting f^2(t) to error^2.",
 932     "When the actual block average is very close to the analytical curve,",
 933     "the error is sigma*sqrt(2/T (a tau1 + (1-a) tau2)).",
 934     "The complete derivation is given in",
 935     "B. Hess, J. Chem. Phys. 116:209-217, 2002.[PAR]",
 936
 937     "Option [TT]-bal[TT] finds and subtracts the ultrafast \"ballistic\"",
 938     "component from a hydrogen bond autocorrelation function by the fitting",
 939     "of a sum of exponentials, as described in e.g.",
 940     "O. Markovitch, J. Chem. Phys. 129:084505, 2008. The fastest term",
 941     "is the one with the most negative coefficient in the exponential,",
 942     "or with [TT]-d[TT], the one with most negative time derivative at time 0.",
 943     "[]TT-nbalexp[TT] sets the number of exponentials to fit.[PAR]",
 944
 945     "Option [TT]-gem[TT] fits bimolecular rate constants ka and kb",
 946     "(and optionally kD) to the hydrogen bond autocorrelation function",
 947     "according to the reversible geminate recombination model. Removal of",
 948     "the ballistic component first is strongly adviced. The model is presented in",
 949     "O. Markovitch, J. Chem. Phys. 129:084505, 2008.[PAR]",
 950
 951     "Option [TT]-filter[tt] prints the RMS high-frequency fluctuation",
 952     "of each set and over all sets with respect to a filtered average.",
 953     "The filter is proportional to cos(pi t/len) where t goes from -len/2",
 954     "to len/2. len is supplied with the option [TT]-filter[tt].",
 955     "This filter reduces oscillations with period len/2 and len by a factor",
 956     "of 0.79 and 0.33 respectively.[PAR]",
 957
 958     "Option [TT]-g[tt] fits the data to the function given with option",
 959     "[TT]-fitfn[tt].[PAR]",
 960
 961     "Option [TT]-power[tt] fits the data to b t^a, which is accomplished",
 962     "by fitting to a t + b on log-log scale. All points after the first",
 963     "zero or negative value are ignored.[PAR]"
 964
 965     "Option [TT]-luzar[tt] performs a Luzar & Chandler kinetics analysis",
 966     "on output from [TT]g_hbond[tt]. The input file can be taken directly",
 967     "from [TT]g_hbond -ac[tt], and then the same result should be produced."
 968   };
 969   static real tb=-1,te=-1,frac=0.5,filtlen=0,binwidth=0.1,aver_start=0;
 970   static bool bHaveT=TRUE,bDer=FALSE,bSubAv=TRUE,bAverCorr=FALSE,bXYdy=FALSE;
 971   static bool bEESEF=FALSE,bEENLC=FALSE,bEeFitAc=FALSE,bPower=FALSE;
 972   static bool bIntegrate=FALSE,bRegression=FALSE,bLuzar=FALSE,bLuzarError=FALSE;
 973   static int  nsets_in=1,d=1,nb_min=4,resol=10, nBalExp=4;
 974   static real temp=298.15,fit_start=1,smooth_tail_start=-1, logAfterTime=10, balTime=0.2, diffusion=0,rcut=0.35;
 975
 976   /* must correspond to enum avbar* declared at beginning of file */
 977   static const char *avbar_opt[avbarNR+1] = {
 978     NULL, "none", "stddev", "error", "90", NULL
 979   };
 980
 981   t_pargs pa[] = {
 982     { "-time",    FALSE, etBOOL, {&bHaveT},
 983       "Expect a time in the input" },
 984     { "-b",       FALSE, etREAL, {&tb},
 985       "First time to read from set" },
 986     { "-e",       FALSE, etREAL, {&te},
 987       "Last time to read from set" },
 988     { "-n",       FALSE, etINT, {&nsets_in},
 989       "Read # sets seperated by &" },
 990     { "-d",       FALSE, etBOOL, {&bDer},
 991         "Use the derivative" },
 992     { "-dp",      FALSE, etINT, {&d},
 993       "HIDDENThe derivative is the difference over # points" },
 994     { "-bw",      FALSE, etREAL, {&binwidth},
 995       "Binwidth for the distribution" },
 996     { "-errbar",  FALSE, etENUM, {avbar_opt},
 997       "Error bars for -av" },
 998     { "-integrate",FALSE,etBOOL, {&bIntegrate},
 999       "Integrate data function(s) numerically using trapezium rule" },
1000     { "-aver_start",FALSE, etREAL, {&aver_start},
1001       "Start averaging the integral from here" },
1002     { "-xydy",    FALSE, etBOOL, {&bXYdy},
1003       "Interpret second data set as error in the y values for integrating" },
1004     { "-regression",FALSE,etBOOL,{&bRegression},
1005       "Perform a linear regression analysis on the data. If -xydy is set a second set will be interpreted as the error bar in the Y value. Otherwise, if multiple data sets are present a multilinear regression will be performed yielding the constant A that minimize chi^2 = (y - A0 x0 - A1 x1 - ... - AN xN)^2 where now Y is the first data set in the input file and xi the others. Do read the information at the option [TT]-time[tt]." },
1006     { "-luzar",   FALSE, etBOOL, {&bLuzar},
1007       "Do a Luzar and Chandler analysis on a correlation function and related as produced by g_hbond. When in addition the -xydy flag is given the second and fourth column will be interpreted as errors in c(t) and n(t)." },
1008     { "-temp",    FALSE, etREAL, {&temp},
1009       "Temperature for the Luzar hydrogen bonding kinetics analysis" },
1010     { "-fitstart", FALSE, etREAL, {&fit_start},
1011       "Time (ps) from which to start fitting the correlation functions in order to obtain the forward and backward rate constants for HB breaking and formation" },
1012     { "-smooth",FALSE, etREAL, {&smooth_tail_start},
1013       "If >= 0, the tail of the ACF will be smoothed by fitting it to an exponential function: y = A exp(-x/tau)" },
1014     { "-nbmin",   FALSE, etINT, {&nb_min},
1015       "HIDDENMinimum number of blocks for block averaging" },
1016     { "-resol", FALSE, etINT, {&resol},
1017       "HIDDENResolution for the block averaging, block size increases with"
1018     " a factor 2^(1/#)" },
1019     { "-eeexpfit", FALSE, etBOOL, {&bEESEF},
1020       "HIDDENAlways use a single exponential fit for the error estimate" },
1021     { "-eenlc", FALSE, etBOOL, {&bEENLC},
1022       "HIDDENAllow a negative long-time correlation" },
1023     { "-eefitac", FALSE, etBOOL, {&bEeFitAc},
1024       "HIDDENAlso plot analytical block average using a autocorrelation fit" },
1025     { "-filter",  FALSE, etREAL, {&filtlen},
1026       "Print the high-frequency fluctuation after filtering with a cosine filter of length #" },
1027     { "-power", FALSE, etBOOL, {&bPower},
1028       "Fit data to: b t^a" },
1029     { "-subav", FALSE, etBOOL, {&bSubAv},
1030       "Subtract the average before autocorrelating" },
1031     { "-oneacf", FALSE, etBOOL, {&bAverCorr},
1032       "Calculate one ACF over all sets" },
1033     { "-nbalexp", FALSE, etINT, {&nBalExp},
1034       "HIDDENNumber of exponentials to fit to the ultrafast component" },
1035     { "-baltime", FALSE, etREAL, {&balTime},
1036       "HIDDENTime up to which the ballistic component will be fitted" },
1037     { "-rcut", FALSE, etREAL, {&rcut},
1038       "Cut-off for hydrogen bonds in geminate algorithms" },
1039     { "-gemtype", FALSE, etENUM, {gemType},
1040       "What type of gminate recombination to use"},
1041     { "-D", FALSE, etREAL, {&diffusion},
1042       "The self diffusion coefficient which is used for the reversible geminate recombination model."
1043       "If non-positive, then the diffusion coefficient will be one of the parameters fitted"}
1044   };
1045 #define NPA asize(pa)
1046
1047   FILE     *out,*out_fit;
1048   int      n,nlast,s,nset,i,j=0;
1049   real     **val,*t,dt,tot,error;
1050   double   *av,*sig,cum1,cum2,cum3,cum4,db;
1051   const char     *acfile,*msdfile,*ccfile,*distfile,*avfile,*eefile,*balfile,*gemfile,*fitfile;
1052   output_env_t oenv;
1053
1054   t_filenm fnm[] = {
1055     { efXVG, "-f",    "graph",    ffREAD   },
1056     { efXVG, "-ac",   "autocorr", ffOPTWR  },
1057     { efXVG, "-msd",  "msd",      ffOPTWR  },
1058     { efXVG, "-cc",   "coscont",  ffOPTWR  },
1059     { efXVG, "-dist", "distr",    ffOPTWR  },
1060     { efXVG, "-av",   "average",  ffOPTWR  },
1061     { efXVG, "-ee",   "errest",   ffOPTWR  },
1062     { efXVG, "-bal",  "ballisitc",ffOPTWR  },
1063     { efXVG, "-gem",  "geminate", ffOPTWR  },
1064     { efLOG, "-g",    "fitlog",   ffOPTWR  }
1065   };
1066 #define NFILE asize(fnm)
1067
1068   int     npargs;
1069   t_pargs *ppa;
1070
1071   npargs = asize(pa);
1072   ppa    = add_acf_pargs(&npargs,pa);
1073
1074   CopyRight(stderr,argv[0]);
1075   parse_common_args(&argc,argv,PCA_CAN_VIEW,
1076                     NFILE,fnm,npargs,ppa,asize(desc),desc,0,NULL,&oenv);
1077
1078   acfile   = opt2fn_null("-ac",NFILE,fnm);
1079   msdfile  = opt2fn_null("-msd",NFILE,fnm);
1080   ccfile   = opt2fn_null("-cc",NFILE,fnm);
1081   distfile = opt2fn_null("-dist",NFILE,fnm);
1082   avfile   = opt2fn_null("-av",NFILE,fnm);
1083   eefile   = opt2fn_null("-ee",NFILE,fnm);
1084   balfile  = opt2fn_null("-bal",NFILE,fnm);
1085   gemfile  = opt2fn_null("-gem",NFILE,fnm);
1086   if (opt2parg_bSet("-fitfn",npargs,ppa))
1087     fitfile  = opt2fn("-g",NFILE,fnm);
1088   else
1089     fitfile  = opt2fn_null("-g",NFILE,fnm);
1090
1091   val=read_xvg_time(opt2fn("-f",NFILE,fnm),bHaveT,
1092                     opt2parg_bSet("-b",npargs,ppa),tb,
1093                     opt2parg_bSet("-e",npargs,ppa),te,
1094                     nsets_in,&nset,&n,&dt,&t);
1095   printf("Read %d sets of %d points, dt = %g\n\n",nset,n,dt);
1096
1097   if (bDer) {
1098     printf("Calculating the derivative as (f[i+%d]-f[i])/(%d*dt)\n\n",
1099             d,d);
1100     n -= d;
1101     for(s=0; s<nset; s++)
1102       for(i=0; (i<n); i++)
1103         val[s][i] = (val[s][i+d]-val[s][i])/(d*dt);
1104   }
1105   if (bIntegrate) {
1106     real sum,stddev;
1107     printf("Calculating the integral using the trapezium rule\n");
1108
1109     if (bXYdy) {
1110       sum = evaluate_integral(n,t,val[0],val[1],aver_start,&stddev);
1111       printf("Integral %10.3f +/- %10.5f\n",sum,stddev);
1112     }
1113     else {
1114       for(s=0; s<nset; s++) {
1115         sum = evaluate_integral(n,t,val[s],NULL,aver_start,&stddev);
1116         printf("Integral %d  %10.5f  +/- %10.5f\n",s+1,sum,stddev);
1117       }
1118     }
1119   }
1120   if (fitfile) {
1121     out_fit = ffopen(fitfile,"w");
1122     if (bXYdy && nset>=2) {
1123       do_fit(out_fit,0,TRUE,n,t,val,npargs,ppa,oenv);
1124     } else {
1125       for(s=0; s<nset; s++)
1126         do_fit(out_fit,s,FALSE,n,t,val,npargs,ppa,oenv);
1127     }
1128     ffclose(out_fit);
1129   }
1130
1131   printf("                                      std. dev.    relative deviation of\n");
1132   printf("                       standard       ---------   cumulants from those of\n");
1133   printf("set      average       deviation      sqrt(n-1)   a Gaussian distribition\n");
1134   printf("                                                      cum. 3   cum. 4\n");
1135   snew(av,nset);
1136   snew(sig,nset);
1137   for(s=0; (s<nset); s++) {
1138     cum1 = 0;
1139     cum2 = 0;
1140     cum3 = 0;
1141     cum4 = 0;
1142     for(i=0; (i<n); i++)
1143       cum1 += val[s][i];
1144     cum1 /= n;
1145     for(i=0; (i<n); i++) {
1146       db = val[s][i]-cum1;
1147       cum2 += db*db;
1148       cum3 += db*db*db;
1149       cum4 += db*db*db*db;
1150     }
1151     cum2  /= n;
1152     cum3  /= n;
1153     cum4  /= n;
1154     av[s]  = cum1;
1155     sig[s] = sqrt(cum2);
1156     if (n > 1)
1157       error = sqrt(cum2/(n-1));
1158     else
1159       error = 0;
1160     printf("SS%d  %13.6e   %12.6e   %12.6e      %6.3f   %6.3f\n",
1161            s+1,av[s],sig[s],error,
1162            sig[s] ? cum3/(sig[s]*sig[s]*sig[s]*sqrt(8/M_PI)) : 0,
1163            sig[s] ? cum4/(sig[s]*sig[s]*sig[s]*sig[s]*3)-1 : 0);
1164   }
1165   printf("\n");
1166
1167   if (filtlen)
1168     filter(filtlen,n,nset,val,dt,oenv);
1169
1170   if (msdfile) {
1171     out=xvgropen(msdfile,"Mean square displacement",
1172                  "time","MSD (nm\\S2\\N)",oenv);
1173     nlast = (int)(n*frac);
1174     for(s=0; s<nset; s++) {
1175       for(j=0; j<=nlast; j++) {
1176         if (j % 100 == 0)
1177           fprintf(stderr,"\r%d",j);
1178         tot=0;
1179         for(i=0; i<n-j; i++)
1180           tot += sqr(val[s][i]-val[s][i+j]);
1181         tot /= (real)(n-j);
1182         fprintf(out," %g %8g\n",dt*j,tot);
1183       }
1184       if (s<nset-1)
1185         fprintf(out,"&\n");
1186     }
1187     ffclose(out);
1188     fprintf(stderr,"\r%d, time=%g\n",j-1,(j-1)*dt);
1189   }
1190   if (ccfile)
1191     plot_coscont(ccfile,n,nset,val,oenv);
1192
1193   if (distfile)
1194     histogram(distfile,binwidth,n,nset,val,oenv);
1195   if (avfile)
1196     average(avfile,nenum(avbar_opt),n,nset,val,t);
1197   if (eefile)
1198     estimate_error(eefile,nb_min,resol,n,nset,av,sig,val,dt,
1199                    bEeFitAc,bEESEF,bEENLC,oenv);
1200   if (balfile)
1201       do_ballistic(balfile,n,t,val,nset,balTime,nBalExp,bDer,oenv);
1202   if (gemfile)
1203       do_geminate(gemfile,n,t,val,nset,diffusion,logAfterTime,rcut,balTime,oenv);
1204   if (bPower)
1205     power_fit(n,nset,val,t);
1206   if (acfile) {
1207     if (bSubAv)
1208       for(s=0; s<nset; s++)
1209         for(i=0; i<n; i++)
1210           val[s][i] -= av[s];
1211     do_autocorr(acfile,oenv,"Autocorrelation",n,nset,val,dt,
1212                 eacNormal,bAverCorr);
1213   }
1214   if (bRegression)
1215       regression_analysis(n,bXYdy,t,nset,val);
1216
1217   if (bLuzar)
1218     luzar_correl(n,t,nset,val,temp,bXYdy,fit_start,smooth_tail_start,oenv);
1219
1220   view_all(oenv,NFILE, fnm);
1221
1222   thanx(stderr);
1223
1224   return 0;
1225 }
1226