src/gmxlib/index.c

   1 /*
   2  *
   3  *                This source code is part of
   4  *
   5  *                 G   R   O   M   A   C   S
   6  *
   7  *          GROningen MAchine for Chemical Simulations
   8  *
   9  *                        VERSION 3.2.0
  10  * Written by David van der Spoel, Erik Lindahl, Berk Hess, and others.
  11  * Copyright (c) 1991-2000, University of Groningen, The Netherlands.
  12  * Copyright (c) 2001-2004, The GROMACS development team,
  13  * check out http://www.gromacs.org for more information.
  14
  15  * This program is free software; you can redistribute it and/or
  16  * modify it under the terms of the GNU General Public License
  17  * as published by the Free Software Foundation; either version 2
  18  * of the License, or (at your option) any later version.
  19  *
  20  * If you want to redistribute modifications, please consider that
  21  * scientific software is very special. Version control is crucial -
  22  * bugs must be traceable. We will be happy to consider code for
  23  * inclusion in the official distribution, but derived work must not
  24  * be called official GROMACS. Details are found in the README & COPYING
  25  * files - if they are missing, get the official version at www.gromacs.org.
  26  *
  27  * To help us fund GROMACS development, we humbly ask that you cite
  28  * the papers on the package - you can find them in the top README file.
  29  *
  30  * For more info, check our website at http://www.gromacs.org
  31  *
  32  * And Hey:
  33  * GROningen Mixture of Alchemy and Childrens' Stories
  34  */
  35 #ifdef HAVE_CONFIG_H
  36 #include <config.h>
  37 #endif
  38
  39 #include <ctype.h>
  40 #include <string.h>
  41 #include "sysstuff.h"
  42 #include "strdb.h"
  43 #include "futil.h"
  44 #include "macros.h"
  45 #include "names.h"
  46 #include "string2.h"
  47 #include "statutil.h"
  48 #include "confio.h"
  49 #include "main.h"
  50 #include "copyrite.h"
  51 #include "typedefs.h"
  52 #include "smalloc.h"
  53 #include "invblock.h"
  54 #include "macros.h"
  55 #include "index.h"
  56 #include "txtdump.h"
  57 #include "gmxfio.h"
  58
  59 typedef enum { etOther, etProt, etDNA, erestNR } eRestp;
  60 static const char *ResTP[erestNR] = { "OTHER", "PROTEIN", "DNA" };
  61
  62 static const char   *Sugars[]     = { "A", "T", "G", "C", "U" };
  63 #define  NDNA asize(Sugars)
  64
  65 static const char *Negate[] = { "SOL" };
  66 #define  NNEGATE asize(Negate)
  67
  68 static bool gmx_ask_yesno(bool bASK)
  69 {
  70   char c;
  71
  72   if (bASK) {
  73     do {
  74       c=toupper(fgetc(stdin));
  75     } while ((c != 'Y') && (c != 'N'));
  76
  77     return (c == 'Y');
  78   }
  79   else
  80     return FALSE;
  81 }
  82
  83 t_blocka *new_blocka(void)
  84 {
  85   t_blocka *block;
  86
  87   snew(block,1);
  88   snew(block->index,1);
  89
  90   return block;
  91 }
  92
  93 void write_index(const char *outf, t_blocka *b,char **gnames)
  94 {
  95   FILE *out;
  96   int  i,j,k;
  97
  98   out=gmx_fio_fopen(outf,"w");
  99   /* fprintf(out,"%5d  %5d\n",b->nr,b->nra); */
 100   for(i=0; (i<b->nr); i++) {
 101     fprintf(out,"[ %s ]\n",gnames[i]);
 102     for(k=0,j=b->index[i]; j<b->index[i+1]; j++,k++) {
 103       fprintf(out,"%4d ",b->a[j]+1);
 104       if ((k % 15) == 14)
 105         fprintf(out,"\n");
 106     }
 107     fprintf(out,"\n");
 108   }
 109   gmx_fio_fclose(out);
 110 }
 111
 112 void add_grp(t_blocka *b,char ***gnames,int nra,atom_id a[],const char *name)
 113 {
 114   int i;
 115
 116   srenew(b->index,b->nr+2);
 117   srenew(*gnames,b->nr+1);
 118   (*gnames)[b->nr]=strdup(name);
 119
 120   srenew(b->a,b->nra+nra);
 121   for(i=0; (i<nra); i++)
 122     b->a[b->nra++]=a[i];
 123   b->nr++;
 124   b->index[b->nr]=b->nra;
 125 }
 126
 127 /* compare index in `a' with group in `b' at `index',
 128    when `index'<0 it is relative to end of `b' */
 129 static bool grp_cmp(t_blocka *b, int nra, atom_id a[], int index)
 130 {
 131   int i;
 132
 133   if (index < 0)
 134     index = b->nr-1+index;
 135   if (index >= b->nr)
 136     gmx_fatal(FARGS,"no such index group %d in t_blocka (nr=%d)",index,b->nr);
 137   /* compare sizes */
 138   if ( nra != b->index[index+1] - b->index[index] )
 139     return FALSE;
 140   for(i=0; i<nra; i++)
 141     if ( a[i] != b->a[b->index[index]+i] )
 142       return FALSE;
 143   return TRUE;
 144 }
 145
 146 static void p_status(int nres,eRestp restp[],bool bVerb)
 147 {
 148   int i,j,ntp[erestNR];
 149
 150   for(i=0; (i<erestNR); i++)
 151     ntp[i]=0;
 152   for(j=0; (j<nres); j++)
 153     ntp[restp[j]]++;
 154
 155   if (bVerb)
 156     for(i=0; (i<erestNR); i++)
 157       printf("There are: %5d %10s residues\n",ntp[i],ResTP[i]);
 158 }
 159
 160 atom_id *mk_aid(t_atoms *atoms,eRestp restp[],eRestp res,int *nra,
 161                 bool bTrue)
 162 /* Make an array of atom_ids for all atoms with:
 163  * (restp[i] == res) == bTrue
 164  */
 165 {
 166   atom_id *a;
 167   int     i;
 168
 169   snew(a,atoms->nr);
 170   *nra=0;
 171   for(i=0; (i<atoms->nr); i++)
 172     if ((restp[atoms->atom[i].resind] == res) == bTrue)
 173       a[(*nra)++]=i;
 174
 175   return a;
 176 }
 177
 178 typedef struct {
 179   char *rname;
 180   bool bNeg;
 181   char *gname;
 182 } restp_t;
 183
 184 static void analyse_other(eRestp Restp[],t_atoms *atoms,
 185                           t_blocka *gb,char ***gn,bool bASK,bool bVerb)
 186 {
 187   restp_t *restp=NULL;
 188   char **attp=NULL;
 189   char *rname,*aname;
 190   atom_id *other_ndx,*aid,*aaid;
 191   int  i,j,k,l,resind,naid,naaid,natp,nrestp=0;
 192
 193   for(i=0; (i<atoms->nres); i++)
 194     if (Restp[i] == etOther)
 195       break;
 196   if (i < atoms->nres) {
 197     /* we have others */
 198     if (bVerb)
 199       printf("Analysing Other...\n");
 200     snew(other_ndx,atoms->nr);
 201     for(k=0; (k<atoms->nr); k++) {
 202       resind = atoms->atom[k].resind;
 203       rname = *atoms->resinfo[resind].name;
 204       if (Restp[resind] == etOther) {
 205         for(l=0; (l<nrestp); l++)
 206           if (strcmp(restp[l].rname,rname) == 0)
 207             break;
 208         if (l==nrestp) {
 209           srenew(restp,nrestp+1);
 210           restp[nrestp].rname = strdup(rname);
 211           restp[nrestp].bNeg  = FALSE;
 212           restp[nrestp].gname = strdup(rname);
 213           nrestp++;
 214           for(i=0; i<NNEGATE; i++) {
 215             if (strcmp(rname,Negate[i]) == 0) {
 216               srenew(restp,nrestp+1);
 217               restp[nrestp].rname = strdup(rname);
 218               restp[nrestp].bNeg  = TRUE;
 219               snew(restp[nrestp].gname,4+strlen(rname)+1);
 220               sprintf(restp[nrestp].gname,"%s%s","non-",rname);
 221               nrestp++;
 222             }
 223           }
 224         }
 225       }
 226     }
 227     for(i=0; (i<nrestp); i++) {
 228       snew(aid,atoms->nr);
 229       naid=0;
 230       for(j=0; (j<atoms->nr); j++) {
 231         rname = *atoms->resinfo[atoms->atom[j].resind].name;
 232         if ((strcmp(restp[i].rname,rname) == 0 && !restp[i].bNeg) ||
 233             (strcmp(restp[i].rname,rname) != 0 &&  restp[i].bNeg)) {
 234           aid[naid++] = j;
 235         }
 236       }
 237       add_grp(gb,gn,naid,aid,restp[i].gname);
 238       if (bASK) {
 239         printf("split %s into atoms (y/n) ? ",restp[i].gname);
 240         fflush(stdout);
 241         if (gmx_ask_yesno(bASK)) {
 242           natp=0;
 243           for(k=0; (k<naid); k++) {
 244             aname=*atoms->atomname[aid[k]];
 245             for(l=0; (l<natp); l++)
 246               if (strcmp(aname,attp[l]) == 0)
 247                 break;
 248             if (l == natp) {
 249               srenew(attp,++natp);
 250               attp[natp-1]=aname;
 251             }
 252           }
 253           if (natp > 1) {
 254             for(l=0; (l<natp); l++) {
 255               snew(aaid,naid);
 256               naaid=0;
 257               for(k=0; (k<naid); k++) {
 258                 aname=*atoms->atomname[aid[k]];
 259                 if (strcmp(aname,attp[l])==0)
 260                   aaid[naaid++]=aid[k];
 261               }
 262               add_grp(gb,gn,naaid,aaid,attp[l]);
 263               sfree(aaid);
 264             }
 265           }
 266           sfree(attp);
 267           attp=NULL;
 268         }
 269         sfree(aid);
 270       }
 271     }
 272     sfree(other_ndx);
 273   }
 274 }
 275
 276 static void analyse_prot(eRestp restp[],t_atoms *atoms,
 277                          t_blocka *gb,char ***gn,bool bASK,bool bVerb)
 278 {
 279   /* atomnames to be used in constructing index groups: */
 280   static const char *pnoh[]    = { "H" };
 281   static const char *pnodum[]  = { "MN1",  "MN2",  "MCB1", "MCB2", "MCG1", "MCG2",
 282                              "MCD1", "MCD2", "MCE1", "MCE2", "MNZ1", "MNZ2" };
 283   static const char *calpha[]  = { "CA" };
 284   static const char *bb[]      = { "N","CA","C" };
 285   static const char *mc[]      = { "N","CA","C","O","O1","O2","OXT" };
 286   static const char *mcb[]     = { "N","CA","CB","C","O","O1","O2","OT","OXT" };
 287   static const char *mch[]     = { "N","CA","C","O","O1","O2","OT","OXT",
 288                              "H1","H2","H3","H" };
 289   /* array of arrays of atomnames: */
 290   static const char **chains[] = { NULL,pnoh,calpha,bb,mc,mcb,mch,mch,mch,pnodum };
 291 #define NCH asize(chains)
 292   /* array of sizes of arrays of atomnames: */
 293   const int       sizes[NCH] = {
 294     0, asize(pnoh), asize(calpha), asize(bb),
 295     asize(mc), asize(mcb), asize(mch), asize(mch), asize(mch), asize(pnodum)
 296   };
 297   /* descriptive names of index groups */
 298   const char   *ch_name[NCH] = {
 299     "Protein", "Protein-H", "C-alpha", "Backbone",
 300     "MainChain", "MainChain+Cb", "MainChain+H", "SideChain", "SideChain-H",
 301     "Prot-Masses"
 302   };
 303   /* construct index group containing (TRUE) or excluding (FALSE)
 304      given atom names */
 305   const bool complement[NCH] = {
 306     TRUE, TRUE, FALSE, FALSE, FALSE, FALSE, FALSE, TRUE, TRUE, TRUE
 307   };
 308   const int  wholename[NCH]  = { -1, 0,-1,-1,-1,-1,-1,-1, 11,-1 };
 309   /* the index in wholename gives the first item in the arrays of
 310    * atomtypes that should be tested with 'strncasecmp' in stead of
 311    * strcasecmp, or -1 if all items should be tested with strcasecmp
 312    * This is comparable to using a '*' wildcard at the end of specific
 313    * atom names, but that is more involved to implement...
 314    */
 315   /* only add index group if it differs from the specified one,
 316      specify -1 to always add group */
 317   const int compareto[NCH] = { -1,-1,-1,-1,-1,-1,-1,-1,-1, 0 };
 318
 319   int     n,j;
 320   atom_id *aid;
 321   int     nra,nnpres,npres;
 322   bool    match;
 323   char    ndx_name[STRLEN],*atnm;
 324   int i;
 325
 326   if (bVerb)
 327     printf("Analysing Protein...\n");
 328   snew(aid,atoms->nr);
 329
 330   /* calculate the number of protein residues */
 331   npres=0;
 332   for(i=0; (i<atoms->nres); i++)
 333     if (restp[i] == etProt)
 334       npres++;
 335
 336   /* find matching or complement atoms */
 337   for(i=0; (i<(int)NCH); i++) {
 338     nra=0;
 339     for(n=0; (n<atoms->nr); n++) {
 340       if (restp[atoms->atom[n].resind] == etProt) {
 341         match=FALSE;
 342         for(j=0; (j<sizes[i]); j++) {
 343           /* skip digits at beginning of atomname, e.g. 1H */
 344           atnm=*atoms->atomname[n];
 345           while (isdigit(atnm[0]))
 346             atnm++;
 347           if ( (wholename[i]==-1) || (j<wholename[i]) ) {
 348             if (strcasecmp(chains[i][j],atnm) == 0)
 349               match=TRUE;
 350           } else {
 351             if (strncasecmp(chains[i][j],atnm,strlen(chains[i][j])) == 0)
 352               match=TRUE;
 353           }
 354         }
 355         if (match != complement[i])
 356           aid[nra++]=n;
 357       }
 358     }
 359     /* if we want to add this group always or it differs from previous
 360        group, add it: */
 361     if ( compareto[i] == -1 || !grp_cmp(gb,nra,aid,compareto[i]-i) )
 362       add_grp(gb,gn,nra,aid,ch_name[i]);
 363   }
 364
 365   if (bASK) {
 366     for(i=0; (i<(int)NCH); i++) {
 367       printf("Split %12s into %5d residues (y/n) ? ",ch_name[i],npres);
 368       if (gmx_ask_yesno(bASK)) {
 369         int resind;
 370         nra = 0;
 371         for(n=0;((atoms->atom[n].resind < npres) && (n<atoms->nr));) {
 372           resind = atoms->atom[n].resind;
 373           for(;((atoms->atom[n].resind==resind) && (n<atoms->nr));n++) {
 374             match=FALSE;
 375             for(j=0;(j<sizes[i]); j++)
 376               if (strcasecmp(chains[i][j],*atoms->atomname[n]) == 0)
 377                 match=TRUE;
 378             if (match != complement[i])
 379               aid[nra++]=n;
 380           }
 381           /* copy the residuename to the tail of the groupname */
 382           if (nra > 0) {
 383             t_resinfo *ri;
 384             ri = &atoms->resinfo[resind];
 385             sprintf(ndx_name,"%s_%s%d%c",
 386                     ch_name[i],*ri->name,ri->nr,ri->ic==' ' ? '\0' : ri->ic);
 387             add_grp(gb,gn,nra,aid,ndx_name);
 388             nra = 0;
 389           }
 390         }
 391       }
 392     }
 393     printf("Make group with sidechain and C=O swapped (y/n) ? ");
 394     if (gmx_ask_yesno(bASK)) {
 395       /* Make swap sidechain C=O index */
 396       int resind,hold;
 397       nra = 0;
 398       for(n=0;((atoms->atom[n].resind < npres) && (n<atoms->nr));) {
 399         resind = atoms->atom[n].resind;
 400         hold  = -1;
 401         for(;((atoms->atom[n].resind==resind) && (n<atoms->nr));n++)
 402           if (strcmp("CA",*atoms->atomname[n]) == 0) {
 403             aid[nra++]=n;
 404             hold=nra;
 405             nra+=2;
 406           } else if (strcmp("C",*atoms->atomname[n]) == 0) {
 407             if (hold == -1)
 408               gmx_incons("Atom naming problem");
 409             aid[hold]=n;
 410           } else if (strcmp("O",*atoms->atomname[n]) == 0) {
 411             if (hold == -1)
 412               gmx_incons("Atom naming problem");
 413             aid[hold+1]=n;
 414           } else if (strcmp("O1",*atoms->atomname[n]) == 0) {
 415             if (hold == -1)
 416               gmx_incons("Atom naming problem");
 417             aid[hold+1]=n;
 418           } else
 419             aid[nra++]=n;
 420       }
 421       /* copy the residuename to the tail of the groupname */
 422       if (nra > 0) {
 423         add_grp(gb,gn,nra,aid,"SwapSC-CO");
 424         nra = 0;
 425       }
 426     }
 427   }
 428   sfree(aid);
 429 }
 430
 431 static void analyse_dna(eRestp restp[],t_atoms *atoms,
 432                         t_blocka *gb,char ***gn,bool bASK,bool bVerb)
 433 {
 434   if (bVerb)
 435     printf("Analysing DNA... (not really)\n");
 436   if (debug)
 437     printf("eRestp %p; atoms %p; gb %p; gn %p; bASK %s; bASK %s",
 438            (void *)restp, (void *)atoms, (void *)gb, (void *)gn,
 439            bool_names[bASK], bool_names[bVerb]);
 440 }
 441
 442 t_aa_names *get_aa_names(void)
 443 {
 444   /* Read the database in aminoacids.dat */
 445   t_aa_names *aan;
 446
 447   snew(aan,1);
 448
 449   aan->n = get_strings("aminoacids.dat",&(aan->aa));
 450   /* qsort(aan->aa,aan->n,sizeof(aan->aa[0]),strcmp);*/
 451
 452   return aan;
 453 }
 454
 455 bool is_protein(t_aa_names *aan,char *resnm)
 456 {
 457   /* gives true if resnm occurs in aminoacids.dat */
 458   int i;
 459
 460   for(i=0; (i<aan->n); i++)
 461     if (strcasecmp(aan->aa[i],resnm) == 0)
 462       return TRUE;
 463
 464   return FALSE;
 465 }
 466
 467 void done_aa_names(t_aa_names **aan)
 468 {
 469   /* Free memory */
 470   int i;
 471
 472   for(i=0; (i<(*aan)->n); i++)
 473     sfree((*aan)->aa[i]);
 474   sfree((*aan)->aa);
 475   sfree(*aan);
 476   *aan = NULL;
 477 }
 478
 479 void analyse(t_atoms *atoms,t_blocka *gb,char ***gn,bool bASK,bool bVerb)
 480 {
 481   t_aa_names *aan;
 482   eRestp  *restp;
 483   char    *resnm;
 484   atom_id *aid;
 485   int     nra;
 486   int     i;
 487   size_t  j;
 488
 489   if (bVerb)
 490     printf("Analysing residue names:\n");
 491   snew(restp,atoms->nres);
 492   aid=mk_aid(atoms,restp,etOther,&nra,TRUE);
 493   add_grp(gb,gn,nra,aid,"System");
 494   sfree(aid);
 495
 496   aan = get_aa_names();
 497   for(i=0; (i<atoms->nres); i++) {
 498     resnm = *atoms->resinfo[i].name;
 499     if ((restp[i] == etOther) && is_protein(aan,resnm))
 500       restp[i] = etProt;
 501     if (restp[i] == etOther)
 502       for(j=0; (j<NDNA);  j++) {
 503         if (strcasecmp(Sugars[j],resnm) == 0)
 504           restp[i] = etDNA;
 505       }
 506   }
 507   p_status(atoms->nres,restp,bVerb);
 508   done_aa_names(&aan);
 509
 510   /* Protein */
 511   aid=mk_aid(atoms,restp,etProt,&nra,TRUE);
 512   if (nra > 0)
 513     analyse_prot(restp,atoms,gb,gn,bASK,bVerb);
 514
 515   sfree(aid);
 516
 517   /* Non-Protein */
 518   aid=mk_aid(atoms,restp,etProt,&nra,FALSE);
 519   if ((nra > 0) && (nra < atoms->nr))
 520     add_grp(gb,gn,nra,aid,"non-Protein");
 521   sfree(aid);
 522
 523   /* DNA */
 524   aid=mk_aid(atoms,restp,etDNA,&nra,TRUE);
 525   if (nra > 0) {
 526     add_grp(gb,gn,nra,aid,"DNA");
 527     analyse_dna(restp,atoms,gb,gn,bASK,bVerb);
 528   }
 529   sfree(aid);
 530
 531   /* Other */
 532   analyse_other(restp,atoms,gb,gn,bASK,bVerb);
 533
 534   sfree(restp);
 535 }
 536
 537 void check_index(char *gname,int n,atom_id index[],char *traj,int natoms)
 538 {
 539   int i;
 540
 541   for(i=0; i<n; i++)
 542     if (index[i] >= natoms)
 543       gmx_fatal(FARGS,"%s atom number (index[%d]=%d) is larger than the number of atoms in %s (%d)",
 544                   gname ? gname : "Index",i+1, index[i]+1,
 545                   traj ? traj : "the trajectory",natoms);
 546     else if (index[i] < 0)
 547       gmx_fatal(FARGS,"%s atom number (index[%d]=%d) is less than zero",
 548                 gname ? gname : "Index",i+1, index[i]+1);
 549 }
 550
 551 t_blocka *init_index(const char *gfile, char ***grpname)
 552 {
 553   FILE     *in;
 554   t_blocka  *b;
 555   int      a,maxentries;
 556   int      i,j,ng,nread;
 557   char     line[STRLEN],*pt,str[STRLEN];
 558
 559   in=gmx_fio_fopen(gfile,"r");
 560   snew(b,1);
 561   get_a_line(in,line,STRLEN);
 562   if ( line[0]=='[' ) {
 563     /* new format */
 564     b->nr=0;
 565     b->index=NULL;
 566     b->nra=0;
 567     b->a=NULL;
 568     *grpname=NULL;
 569     maxentries=0;
 570     do {
 571       if (get_header(line,str)) {
 572         b->nr++;
 573         srenew(b->index,b->nr+1);
 574         srenew(*grpname,b->nr);
 575         if (b->nr==1)
 576           b->index[0]=0;
 577         b->index[b->nr]=b->index[b->nr-1];
 578         (*grpname)[b->nr-1]=strdup(str);
 579       } else {
 580         pt=line;
 581         while ((i=sscanf(pt,"%s",str)) == 1) {
 582           i=b->index[b->nr];
 583           if (i>=maxentries) {
 584             maxentries+=1024;
 585             srenew(b->a,maxentries);
 586           }
 587           b->a[i]=strtol(str, NULL, 10)-1;
 588           b->index[b->nr]++;
 589           (b->nra)++;
 590           pt=strstr(pt,str)+strlen(str);
 591         }
 592       }
 593     } while (get_a_line(in,line,STRLEN));
 594   }
 595   else {
 596     /* old format */
 597     sscanf(line,"%d%d",&b->nr,&b->nra);
 598     snew(b->index,b->nr+1);
 599     snew(*grpname,b->nr);
 600     b->index[0]=0;
 601     snew(b->a,b->nra);
 602     for (i=0; (i<b->nr); i++) {
 603       nread=fscanf(in,"%s%d",str,&ng);
 604       (*grpname)[i]=strdup(str);
 605       b->index[i+1]=b->index[i]+ng;
 606       if (b->index[i+1] > b->nra)
 607         gmx_fatal(FARGS,"Something wrong in your indexfile at group %s",str);
 608       for(j=0; (j<ng); j++) {
 609         nread=fscanf(in,"%d",&a);
 610         b->a[b->index[i]+j]=a;
 611       }
 612     }
 613   }
 614   gmx_fio_fclose(in);
 615
 616   for(i=0; (i<b->nr); i++) {
 617     for(j=b->index[i]; (j<b->index[i+1]); j++) {
 618       if (b->a[j] < 0)
 619         fprintf(stderr,"\nWARNING: negative index %d in group %s\n\n",
 620                 b->a[j],(*grpname)[i]);
 621     }
 622   }
 623
 624   return b;
 625 }
 626
 627 static void minstring(char *str)
 628 {
 629   int i;
 630
 631   for (i=0; (i < (int)strlen(str)); i++)
 632     if (str[i]=='-')
 633       str[i]='_';
 634 }
 635
 636 int find_group(char s[], int ngrps, char **grpname)
 637 {
 638   int aa, i, n;
 639   char string[STRLEN];
 640   bool bMultiple;
 641
 642   bMultiple = FALSE;
 643   n = strlen(s);
 644   aa=NOTSET;
 645   /* first look for whole name match */
 646   if (aa==NOTSET)
 647     for(i=0; i<ngrps; i++)
 648       if (strcasecmp_min(s,grpname[i])==0) {
 649         if(aa!=NOTSET)
 650           bMultiple = TRUE;
 651         aa=i;
 652       }
 653   /* second look for first string match */
 654   if (aa==NOTSET)
 655     for(i=0; i<ngrps; i++)
 656       if (strncasecmp_min(s,grpname[i],n)==0) {
 657         if(aa!=NOTSET)
 658           bMultiple = TRUE;
 659         aa=i;
 660       }
 661   /* last look for arbitrary substring match */
 662   if (aa==NOTSET) {
 663     upstring(s);
 664     minstring(s);
 665     for(i=0; i<ngrps; i++) {
 666       strcpy(string, grpname[i]);
 667       upstring(string);
 668       minstring(string);
 669       if (strstr(string,s)!=NULL) {
 670         if(aa!=NOTSET)
 671           bMultiple = TRUE;
 672         aa=i;
 673       }
 674     }
 675   }
 676   if (bMultiple) {
 677     printf("Error: Multiple groups '%s' selected\n", s);
 678     aa=NOTSET;
 679   }
 680   return aa;
 681 }
 682
 683 static int qgroup(int *a, int ngrps, char **grpname)
 684 {
 685     char s[STRLEN];
 686     int  aa;
 687     bool bInRange;
 688     char *end;
 689
 690     do {
 691         fprintf(stderr,"Select a group: ");
 692         do {
 693             if ( scanf("%s",s)!=1 )
 694                 gmx_fatal(FARGS,"Cannot read from input");
 695             trim(s); /* remove spaces */
 696         } while (strlen(s)==0);
 697         aa = strtol(s, &end, 10);
 698         if (aa==0 && end[0] != '\0') /* string entered */
 699             aa = find_group(s, ngrps, grpname);
 700         bInRange = (aa >= 0 && aa < ngrps);
 701         if (!bInRange)
 702             printf("Error: No such group '%s'\n", s);
 703     } while (!bInRange);
 704     printf("Selected %d: '%s'\n", aa, grpname[aa]);
 705     *a = aa;
 706     return aa;
 707 }
 708
 709 static void rd_groups(t_blocka *grps,char **grpname,char *gnames[],
 710                       int ngrps,int isize[],atom_id *index[],int grpnr[])
 711 {
 712   int i,j,gnr1;
 713
 714   if (grps->nr==0)
 715     gmx_fatal(FARGS,"Error: no groups in indexfile");
 716   for(i=0; (i<grps->nr); i++)
 717     fprintf(stderr,"Group %5d (%12s) has %5d elements\n",i,grpname[i],
 718            grps->index[i+1]-grps->index[i]);
 719   for(i=0; (i<ngrps); i++) {
 720     if (grps->nr > 1)
 721       do {
 722         gnr1=qgroup(&grpnr[i], grps->nr, grpname);
 723         if ((gnr1<0) || (gnr1>=grps->nr))
 724           fprintf(stderr,"Select between %d and %d.\n",0,grps->nr-1);
 725       } while ((gnr1<0) || (gnr1>=grps->nr));
 726     else {
 727       fprintf(stderr,"There is one group in the index\n");
 728       gnr1=0;
 729     }
 730     gnames[i]=strdup(grpname[gnr1]);
 731     isize[i]=grps->index[gnr1+1]-grps->index[gnr1];
 732     snew(index[i],isize[i]);
 733     for(j=0; (j<isize[i]); j++)
 734       index[i][j]=grps->a[grps->index[gnr1]+j];
 735   }
 736 }
 737
 738 void rd_index(const char *statfile,int ngrps,int isize[],
 739               atom_id *index[],char *grpnames[])
 740 {
 741   char    **gnames;
 742   t_blocka *grps;
 743   int     *grpnr;
 744
 745   snew(grpnr,ngrps);
 746   if (!statfile)
 747     gmx_fatal(FARGS,"No index file specified");
 748   grps=init_index(statfile,&gnames);
 749   rd_groups(grps,gnames,grpnames,ngrps,isize,index,grpnr);
 750 }
 751
 752 void rd_index_nrs(char *statfile,int ngrps,int isize[],
 753                   atom_id *index[],char *grpnames[],int grpnr[])
 754 {
 755   char    **gnames;
 756   t_blocka *grps;
 757
 758   if (!statfile)
 759     gmx_fatal(FARGS,"No index file specified");
 760   grps=init_index(statfile,&gnames);
 761
 762   rd_groups(grps,gnames,grpnames,ngrps,isize,index,grpnr);
 763 }
 764
 765 void get_index(t_atoms *atoms, const char *fnm, int ngrps,
 766                int isize[], atom_id *index[],char *grpnames[])
 767 {
 768   char    ***gnames;
 769   t_blocka *grps = NULL;
 770   int     *grpnr;
 771
 772   snew(grpnr,ngrps);
 773   snew(gnames,1);
 774   if (fnm != NULL) {
 775     grps=init_index(fnm,gnames);
 776   }
 777   else if (atoms) {
 778     snew(grps,1);
 779     snew(grps->index,1);
 780     analyse(atoms,grps,gnames,FALSE,FALSE);
 781   }
 782   else
 783     gmx_incons("You need to supply a valid atoms structure or a valid index file name");
 784
 785   rd_groups(grps,*gnames,grpnames,ngrps,isize,index,grpnr);
 786 }
 787
 788 t_cluster_ndx *cluster_index(FILE *fplog,const char *ndx)
 789 {
 790   t_cluster_ndx *c;
 791   int i;
 792
 793   snew(c,1);
 794   c->clust     = init_index(ndx,&c->grpname);
 795   c->maxframe = -1;
 796   for(i=0; (i<c->clust->nra); i++)
 797     c->maxframe = max(c->maxframe,c->clust->a[i]);
 798   fprintf(fplog ? fplog : stdout,
 799           "There are %d clusters containing %d structures, highest framenr is %d\n",
 800           c->clust->nr,c->clust->nra,c->maxframe);
 801   if (debug) {
 802     pr_blocka(debug,0,"clust",c->clust,TRUE);
 803     for(i=0; (i<c->clust->nra); i++)
 804       if ((c->clust->a[i] < 0) || (c->clust->a[i] > c->maxframe))
 805         gmx_fatal(FARGS,"Range check error for c->clust->a[%d] = %d\n"
 806                   "should be within 0 and %d",i,c->clust->a[i],c->maxframe+1);
 807   }
 808   c->inv_clust=make_invblocka(c->clust,c->maxframe);
 809
 810   return c;
 811 }
 812