RubyGems - apriori - Versions diffs - 0.2.1 - Mend

apriori 0.2.1

Files changed (122) hide show

data/History.txt +16 -0
data/License.txt +20 -0
data/Manifest.txt +121 -0
data/README.txt +149 -0
data/Rakefile +15 -0
data/TODO.txt +60 -0
data/attic/c_ext_test1/MyTest/MyTest.c +23 -0
data/attic/c_ext_test1/MyTest/extconf.rb +11 -0
data/attic/c_ext_test1/mytest.rb +10 -0
data/attic/test.c +12 -0
data/config/hoe.rb +81 -0
data/config/requirements.rb +29 -0
data/examples/01_simple_example.rb +32 -0
data/examples/02_small_file_example.rb +17 -0
data/examples/03_large_file_example.rb +22 -0
data/examples/test_data/market_basket_basic_test.dat +9 -0
data/ext/Apriori.c +149 -0
data/ext/Makefile +149 -0
data/ext/apriori/doc/apriori.html +1301 -0
data/ext/apriori/doc/arem.gp +68 -0
data/ext/apriori/doc/c_rev.gp +89 -0
data/ext/apriori/doc/chi2.tex +156 -0
data/ext/apriori/doc/copying +504 -0
data/ext/apriori/doc/line.gif +0 -0
data/ext/apriori/doc/uparrow.gif +0 -0
data/ext/apriori/ex/flg2set +15 -0
data/ext/apriori/ex/hdr2set +13 -0
data/ext/apriori/ex/readme +71 -0
data/ext/apriori/ex/row2set +7 -0
data/ext/apriori/ex/rulesort +24 -0
data/ext/apriori/ex/tab2set +9 -0
data/ext/apriori/ex/test.app +2 -0
data/ext/apriori/ex/test.rul +9 -0
data/ext/apriori/ex/test1.rul +43 -0
data/ext/apriori/ex/test1.tab +10 -0
data/ext/apriori/ex/test2.tab +10 -0
data/ext/apriori/ex/test3.tab +30 -0
data/ext/apriori/ex/test4.tab +11 -0
data/ext/apriori/ex/test5.tab +39 -0
data/ext/apriori/ex/tid2set +23 -0
data/ext/apriori/ex/xhdr2set +33 -0
data/ext/apriori/src/apriori.c +750 -0
data/ext/apriori/src/apriori.dsp +120 -0
data/ext/apriori/src/apriori.dsw +29 -0
data/ext/apriori/src/apriori.mak +99 -0
data/ext/apriori/src/istree.c +1411 -0
data/ext/apriori/src/istree.h +160 -0
data/ext/apriori/src/makefile +105 -0
data/ext/apriori/src/tract.c +870 -0
data/ext/apriori/src/tract.h +261 -0
data/ext/apriori_wrapper.c +757 -0
data/ext/apriori_wrapper.h +10 -0
data/ext/extconf.rb +32 -0
data/ext/math/doc/copying +504 -0
data/ext/math/src/chi2.c +151 -0
data/ext/math/src/chi2.h +27 -0
data/ext/math/src/choose.c +71 -0
data/ext/math/src/choose.h +16 -0
data/ext/math/src/gamma.c +446 -0
data/ext/math/src/gamma.h +39 -0
data/ext/math/src/intexp.c +35 -0
data/ext/math/src/intexp.h +15 -0
data/ext/math/src/makefile +164 -0
data/ext/math/src/math.mak +48 -0
data/ext/math/src/normal.c +387 -0
data/ext/math/src/normal.h +44 -0
data/ext/math/src/radfn.c +113 -0
data/ext/math/src/radfn.h +34 -0
data/ext/math/src/zeta.c +49 -0
data/ext/math/src/zeta.h +15 -0
data/ext/pre-clean.rb +8 -0
data/ext/pre-setup.rb +9 -0
data/ext/util/doc/copying +504 -0
data/ext/util/src/listops.c +76 -0
data/ext/util/src/listops.h +26 -0
data/ext/util/src/makefile +103 -0
data/ext/util/src/memsys.c +84 -0
data/ext/util/src/memsys.h +42 -0
data/ext/util/src/nstats.c +288 -0
data/ext/util/src/nstats.h +69 -0
data/ext/util/src/params.c +86 -0
data/ext/util/src/params.h +19 -0
data/ext/util/src/parse.c +133 -0
data/ext/util/src/parse.h +81 -0
data/ext/util/src/scan.c +767 -0
data/ext/util/src/scan.h +111 -0
data/ext/util/src/symtab.c +443 -0
data/ext/util/src/symtab.h +121 -0
data/ext/util/src/tabscan.c +279 -0
data/ext/util/src/tabscan.h +99 -0
data/ext/util/src/util.mak +91 -0
data/ext/util/src/vecops.c +317 -0
data/ext/util/src/vecops.h +42 -0
data/lib/apriori.rb +133 -0
data/lib/apriori/adapter.rb +13 -0
data/lib/apriori/association_rule.rb +89 -0
data/lib/apriori/version.rb +9 -0
data/script/console +10 -0
data/script/destroy +14 -0
data/script/generate +14 -0
data/script/txt2html +82 -0
data/setup.rb +1585 -0
data/tasks/apriori.rake +20 -0
data/tasks/attic.rake +28 -0
data/tasks/deployment.rake +34 -0
data/tasks/environment.rake +7 -0
data/tasks/install.rake +13 -0
data/tasks/website.rake +17 -0
data/test/apriori_test.rb +13 -0
data/test/fixtures/market_basket_results_test.txt +5 -0
data/test/fixtures/market_basket_string_test.txt +7 -0
data/test/fixtures/results.txt +2 -0
data/test/fixtures/sample.txt +7 -0
data/test/test_helper.rb +5 -0
data/test/unit/test_apriori.rb +68 -0
data/test/unit/test_itemsets_and_parsing.rb +82 -0
data/website/index.html +248 -0
data/website/index.txt +152 -0
data/website/javascripts/rounded_corners_lite.inc.js +285 -0
data/website/stylesheets/screen.css +142 -0
data/website/template.html.erb +49 -0
metadata +226 -0

@@ -0,0 +1,69 @@
+/*----------------------------------------------------------------------
+  File    : nstats.h
+  Contents: management of normalization statistics
+  Author  : Christian Borgelt
+  History : 2003.08.12 file created
+            2004.08.12 description and parse function added
+----------------------------------------------------------------------*/
+#ifndef __NSTATS__
+#define __NSTATS__
+#include <stdio.h>
+#ifdef NST_PARSE
+#include "parse.h"
+#endif
+/*----------------------------------------------------------------------
+  Type Definitions
+----------------------------------------------------------------------*/
+typedef struct {                /* --- numerical statistics ---
+  Statistics and scaling parameters of a data space with dim
+  dimensions. The accessor macros nst_min, nst_max, nst_offset
+  and nst_factor defined in this header index the members mins,
+  maxs, offs and facs with a dimension index. */
+  int    dim;                   /* dimension of data space */
+  double reg;                   /* number of registered patterns
+                                   (a double; nst_reg is declared
+                                   with a double weight argument) */
+  double *mins;                 /* minimal data values */
+  double *maxs;                 /* maximal data values */
+  double *sums;                 /* sums of data values */
+  double *sqrs;                 /* sums of squared data values */
+  double *offs;                 /* offsets for data scaling */
+  double facs[1];               /* factors for data scaling;
+                                   declared with one element, but
+                                   nst_factor indexes it by
+                                   dimension. NOTE(review): this is
+                                   presumably over-allocated by
+                                   nst_create to hold dim entries
+                                   - confirm in nstats.c before
+                                   changing the declaration */
+} NSTATS;                       /* (numerical statistics) */
+/*----------------------------------------------------------------------
+  Functions
+----------------------------------------------------------------------*/
+extern NSTATS* nst_create (int dim);   /* --- interface overview ---
+  nst_dim, nst_min, nst_max, nst_offset and nst_factor are declared
+  here as functions and are additionally defined as macros at the
+  end of this header; after those definitions a function-like use
+  of these names expands to the macro, i.e. a direct member access.
+  NOTE(review): the behaviour of the other functions is not visible
+  in this header; consult nstats.c before relying on details. */
+extern void    nst_delete (NSTATS *nst);
+extern int     nst_dim    (NSTATS *nst);
+extern void    nst_reg    (NSTATS *nst, const double *vec,
+                           double weight);
+extern void    nst_range  (NSTATS *nst, int idx,
+                           double min, double max);
+extern void    nst_expand (NSTATS *nst, int idx, double factor);
+extern void    nst_scale  (NSTATS *nst, int idx,
+                           double off, double fac);
+extern double  nst_min    (NSTATS *nst, int idx);
+extern double  nst_max    (NSTATS *nst, int idx);
+extern double  nst_offset (NSTATS *nst, int idx);
+extern double  nst_factor (NSTATS *nst, int idx);
+extern void    nst_norm   (NSTATS *nst, const double *vec, double *res);
+extern void    nst_inorm  (NSTATS *nst, const double *vec, double *res);
+extern void    nst_center (NSTATS *nst, double *vec);
+extern void    nst_spans  (NSTATS *nst, double *vec);
+extern int     nst_desc   (NSTATS *nst, FILE *file,
+                           const char *indent, int maxlen);
+#ifdef NST_PARSE                /* nst_parse is declared only if
+                                   NST_PARSE is defined, because
+                                   "parse.h" (which brings in the
+                                   scanner declarations) is included
+                                   by this header only in that case */
+extern NSTATS* nst_parse  (SCAN *scan, int dim);
+#endif
+/*----------------------------------------------------------------------
+  Preprocessor Definitions
+----------------------------------------------------------------------*/
+#define nst_dim(s)        ((s)->dim)      /* number of dimensions;
+  all five macros are plain member accesses on the structure that
+  s points to; the index i is used as given, without range check */
+#define nst_min(s,i)      ((s)->mins[i])  /* entry i of mins */
+#define nst_max(s,i)      ((s)->maxs[i])  /* entry i of maxs */
+#define nst_offset(s,i)   ((s)->offs[i])  /* entry i of offs */
+#define nst_factor(s,i)   ((s)->facs[i])  /* entry i of facs */
+#endif

data/ext/util/src/params.c ADDED

@@ -0,0 +1,86 @@
+/*----------------------------------------------------------------------
+  File    : params.c
+  Contents: command line parameter retrieval
+  Author  : Christian Borgelt
+  History : 2003.06.05 file created
+----------------------------------------------------------------------*/
+#include <stdarg.h>
+#include <stdlib.h>
+#include <assert.h>
+#include "params.h"
+/*----------------------------------------------------------------------
+  Functions
+----------------------------------------------------------------------*/
+/*----------------------------------------------------------------------
+  getints: read up to n base-10 integers, separated by ':', from the
+  string s and store them through the int pointers that follow n in
+  the argument list. Reading stops after n values, at a value that
+  cannot be converted, or when a value is not followed by a colon.
+  *end receives the position set by the last strtol call.
+  Returns the number of values stored.
+----------------------------------------------------------------------*/
+int getints (char *s, char **end, int n, ...)
+{                               /* --- read integer parameters */
+  va_list ap;                   /* cursor over the destinations */
+  int     cnt;                  /* number of values stored so far */
+  int     *dst;                 /* destination of the current value */
+  int     val;                  /* current converted value */
+
+  assert(s && end && (n > 0));  /* validate the arguments */
+  va_start(ap, n);              /* the destinations follow n */
+  for (cnt = 0; cnt < n; s = *end +1) {
+    val = (int)strtol(s, end, 10);
+    if (*end == s) break;       /* nothing converted: stop here */
+    dst  = va_arg(ap, int*);    /* fetch the next destination, */
+    *dst = val; cnt++;          /* store and count the value */
+    if (**end != ':') break;    /* no separator: this was the last */
+  }                             /* (the loop step skips the colon) */
+  va_end(ap);                   /* finish argument processing */
+  return cnt;                   /* report how many values were read */
+}  /* getints() */
+/*--------------------------------------------------------------------*/
+/*----------------------------------------------------------------------
+  getdbls: read up to n floating point numbers, separated by ':',
+  from the string s and store them through the double pointers that
+  follow n in the argument list. Reading stops after n values, at a
+  value that cannot be converted, or when a value is not followed by
+  a colon. *end receives the position set by the last strtod call.
+  Returns the number of values stored.
+----------------------------------------------------------------------*/
+int getdbls (char *s, char **end, int n, ...)
+{                               /* --- read double parameters */
+  va_list ap;                   /* cursor over the destinations */
+  int     cnt;                  /* number of values stored so far */
+  double  *dst;                 /* destination of the current value */
+  double  val;                  /* current converted value */
+
+  assert(s && end && (n > 0));  /* validate the arguments */
+  va_start(ap, n);              /* the destinations follow n */
+  for (cnt = 0; cnt < n; s = *end +1) {
+    val = strtod(s, end);       /* convert the next value */
+    if (*end == s) break;       /* nothing converted: stop here */
+    dst  = va_arg(ap, double*); /* fetch the next destination, */
+    *dst = val; cnt++;          /* store and count the value */
+    if (**end != ':') break;    /* no separator: this was the last */
+  }                             /* (the loop step skips the colon) */
+  va_end(ap);                   /* finish argument processing */
+  return cnt;                   /* report how many values were read */
+}  /* getdbls() */
+/*--------------------------------------------------------------------*/
+/*----------------------------------------------------------------------
+  getintvec: read up to n base-10 integers, separated by ':', from
+  the string s into the array p (which must have room for n values).
+  Reading stops after n values, at a value that cannot be converted,
+  or when a value is not followed by a colon. *end receives the
+  position set by the last strtol call.
+  Returns the number of values stored.
+----------------------------------------------------------------------*/
+int getintvec (char *s, char **end, int n, int *p)
+{                               /* --- read integer vector */
+  int cnt;                      /* number of values stored so far */
+  int val;                      /* current converted value */
+
+  assert(s && end && (n > 0));  /* validate the arguments */
+  for (cnt = 0; cnt < n; s = *end +1) {
+    val = (int)strtol(s, end, 10);
+    if (*end == s) break;       /* nothing converted: stop here */
+    p[cnt++] = val;             /* store and count the value */
+    if (**end != ':') break;    /* no separator: this was the last */
+  }                             /* (the loop step skips the colon) */
+  return cnt;                   /* report how many values were read */
+}  /* getintvec() */
+/*--------------------------------------------------------------------*/
+/*----------------------------------------------------------------------
+  getdblvec: read up to n floating point numbers, separated by ':',
+  from the string s into the array p (which must have room for n
+  values). Reading stops after n values, at a value that cannot be
+  converted, or when a value is not followed by a colon. *end
+  receives the position set by the last strtod call.
+  Returns the number of values stored.
+----------------------------------------------------------------------*/
+int getdblvec (char *s, char **end, int n, double *p)
+{                               /* --- read double vector */
+  int    cnt;                   /* number of values stored so far */
+  double val;                   /* current converted value */
+
+  assert(s && end && (n > 0));  /* validate the arguments */
+  for (cnt = 0; cnt < n; s = *end +1) {
+    val = strtod(s, end);       /* convert the next value */
+    if (*end == s) break;       /* nothing converted: stop here */
+    p[cnt++] = val;             /* store and count the value */
+    if (**end != ':') break;    /* no separator: this was the last */
+  }                             /* (the loop step skips the colon) */
+  return cnt;                   /* report how many values were read */
+}  /* getdblvec() */

data/ext/util/src/params.h ADDED

@@ -0,0 +1,19 @@
+/*----------------------------------------------------------------------
+  File    : params.h
+  Contents: command line parameter retrieval
+  Author  : Christian Borgelt
+  History : 2003.06.05 file created
+----------------------------------------------------------------------*/
+#ifndef __PARAMS__
+#define __PARAMS__
+/*----------------------------------------------------------------------
+  Functions
+----------------------------------------------------------------------*/
+extern int getints   (char *s, char **end, int n, ...);  /* all four
+  functions read up to n numbers separated by ':' from s, set *end
+  through strtol/strtod and return the number of values stored.
+  getints and getdbls store through n pointers (int* / double*)
+  passed after n; getintvec and getdblvec store into the array p.
+  s, end and n > 0 are checked only with assert. */
+extern int getdbls   (char *s, char **end, int n, ...);
+extern int getintvec (char *s, char **end, int n, int    *p);
+extern int getdblvec (char *s, char **end, int n, double *p);
+#endif

data/ext/util/src/parse.c ADDED

@@ -0,0 +1,133 @@
+/*----------------------------------------------------------------------
+  File    : parse.c
+  Contents: parser utilities
+  Author  : Christian Borgelt
+  History : 2004.08.12 file created
+            2006.02.02 error E_EDGE added
+            2007.01.16 error E_MSDCNT added
+----------------------------------------------------------------------*/
+#include <string.h>
+#include <assert.h>
+#include "parse.h"
+/*----------------------------------------------------------------------
+  Constants
+----------------------------------------------------------------------*/
+#ifdef GERMAN                     /* German texts */
+static const char *errmsgs[] = {  /* error messages; the entries
+  are listed in the order of the parser error codes of parse.h,
+  from E_CHREXP (-16) to E_MSDCNT (-47), as noted per entry.
+  The texts are format strings (see the %c and %s conversions).
+  NOTE(review): the E_DUPCDL text is the only one that ends with
+  a newline; this looks unintentional - confirm against the
+  output code of the scanner before changing it. */
+  /* E_CHREXP  -16 */  "\"%c\" erwartet statt %s",
+  /* E_STREXP  -17 */  "\"%s\" erwartet statt %s",
+  /* E_NUMEXP  -18 */  "Zahl erwartet statt %s",
+  /* E_NUMBER  -19 */  "ungültige Zahl %s",
+  /* E_ATTEXP  -20 */  "Attribut erwartet statt %s",
+  /* E_UNKATT  -21 */  "unbekanntes Attribut %s",
+  /* E_DUPATT  -22 */  "doppeltes Attribut %s",
+  /* E_MISATT  -23 */  "Attribut %s fehlt",
+  /* E_ATTRIB  -24 */  "ungültiges Attribut %s",
+  /* E_ATTYPE  -25 */  "Attribut %s hat falschen Typ",
+  /* E_VALEXP  -26 */  "Attributwert erwartet statt %s",
+  /* E_UNKVAL  -27 */  "unbekannter Attributwert %s",
+  /* E_DUPVAL  -28 */  "doppelter Attributwert %s",
+  /* E_MISVAL  -29 */  "fehlender Attributwert %s",
+  /* E_CLSEXP  -30 */  "Klassenattribut erwartet statt %s",
+  /* E_UNKCLS  -31 */  "unbekannte Klasse %s",
+  /* E_DUPCLS  -32 */  "doppelte Klasse %s",
+  /* E_MISCLS  -33 */  "Klasse %s fehlt",
+  /* E_CLSTYPE -34 */  "Klassenattribut %s hat falschen Typ",
+  /* E_CLSCNT  -35 */  "Klassenattribut %s hat zu wenige Werte",
+  /* E_DOMAIN  -36 */  "ungültiger Wertebereich %s",
+  /* E_PAREXP  -37 */  "Parameter erwartet statt %s",
+  /* E_CMPOP   -38 */  "ungültiger Vergleichsoperator %s",
+  /* E_COVMAT  -39 */  "ungültige Kovarianzmatrix",
+  /* E_DUPCDL  -40 */  "doppelte Kandidatenliste für Attribut %s\n",
+  /* E_RANGE   -41 */  "ungültiger Kandidatenbereich",
+  /* E_CAND    -42 */  "ungültiger Kandidat %s",
+  /* E_LINK    -43 */  "ungültiger Verweis",
+  /* E_LYRCNT  -44 */  "ungültige Anzahl Schichten",
+  /* E_UNITCNT -45 */  "ungültige Anzahl Einheiten",
+  /* E_EDGE    -46 */  "ungültiger Kantentyp %s",
+  /* E_MSDCNT  -47 */  "falsche Anzahl Zugehörigkeitsgrade",
+};
+#else                             /* English texts */
+static const char *errmsgs[] = {  /* error messages (same order
+                                     and codes as the German
+                                     table in the other branch) */
+  /* E_CHREXP  -16 */  "\"%c\" expected instead of %s",
+  /* E_STREXP  -17 */  "\"%s\" expected instead of %s",
+  /* E_NUMEXP  -18 */  "number expected instead of %s",
+  /* E_NUMBER  -19 */  "invalid number %s",
+  /* E_ATTEXP  -20 */  "attribute expected instead of %s",
+  /* E_UNKATT  -21 */  "unknown attribute %s",
+  /* E_DUPATT  -22 */  "duplicate attribute %s",
+  /* E_MISATT  -23 */  "missing attribute %s",
+  /* E_ATTRIB  -24 */  "invalid attribute %s",
+  /* E_ATTYPE  -25 */  "attribute %s has wrong type",
+  /* E_VALEXP  -26 */  "attribute value expected instead of %s",
+  /* E_UNKVAL  -27 */  "unknown attribute value %s",
+  /* E_DUPVAL  -28 */  "duplicate attribute value %s",
+  /* E_MISVAL  -29 */  "missing attribute value %s",
+  /* E_CLSEXP  -30 */  "class value expected instead of %s",
+  /* E_UNKCLS  -31 */  "unknown class value %s",
+  /* E_DUPCLS  -32 */  "duplicate class value %s",
+  /* E_MISCLS  -33 */  "missing class value %s",
+  /* E_CLSTYPE -34 */  "class attribute %s has wrong type",
+  /* E_CLSCNT  -35 */  "class attribute %s has too few values",
+  /* E_DOMAIN  -36 */  "invalid attribute domain %s",
+  /* E_PAREXP  -37 */  "parameter expected instead of %s",
+  /* E_CMPOP   -38 */  "invalid comparison operator %s",
+  /* E_COVMAT  -39 */  "invalid covariance matrix",
+  /* E_DUPCDL  -40 */  "duplicate candidate list for attribute %s\n",
+  /* E_RANGE   -41 */  "invalid candidate range",
+  /* E_CAND    -42 */  "invalid candidate %s",
+  /* E_LINK    -43 */  "invalid link",
+  /* E_LYRCNT  -44 */  "invalid number of layers",
+  /* E_UNITCNT -45 */  "invalid number of units",
+  /* E_EDGE    -46 */  "invalid edge type %s",
+  /* E_MSDCNT  -47 */  "wrong number of membership degrees",
+};
+#endif
+/* number of entries in errmsgs; the replacement list is fully */
+/* parenthesized so that it behaves as one operand in any expression */
+/* and the element size is taken from the array itself */
+#define MSGCNT  ((int)(sizeof(errmsgs)/sizeof(errmsgs[0])))
+/*----------------------------------------------------------------------
+  Functions
+----------------------------------------------------------------------*/
+void pa_init (SCAN *scan)
+{                               /* --- initialize parsing */
+  int cnt = MSGCNT;             /* number of parser error messages */
+
+  sc_errmsgs(scan, errmsgs, cnt);  /* pass the message table of */
+}  /* pa_init() */              /* this file and its size to scan */
+/*--------------------------------------------------------------------*/
+/*----------------------------------------------------------------------
+  pa_error: report a parse error through sc_error.
+  scan : scanner the error refers to (must not be NULL)
+  code : parser error code (E_CHREXP ... E_MSDCNT, see parse.h)
+  c    : expected character, passed on only for E_CHREXP
+  s    : expected string for E_STREXP; for the duplicate/missing
+         codes and E_CAND the name to show in the message (if s is
+         NULL the current token value is shown instead)
+  Returns the result of sc_error.
+  The text shown is cut to 255 characters before it is formatted.
+  The original code did this only for token values and formatted a
+  caller supplied name of any length into the fixed size buffer.
+  NOTE(review): that 255 characters always fit into dst after
+  sc_format depends on sc_format, which is not visible here.
+----------------------------------------------------------------------*/
+int pa_error (SCAN *scan, int code, int c, const char *s)
+{                               /* --- report a parse error */
+  const char *txt;              /* text to show in the message */
+  char src[256], dst[1024];     /* buffers for string formatting */
+
+  assert(scan);                 /* check the function arguments */
+  switch (code) {               /* select the text to be shown */
+    case E_DUPATT: case E_MISATT:
+    case E_DUPVAL: case E_MISVAL:
+    case E_DUPCLS: case E_MISCLS:
+    case E_CAND:                /* if "duplicate/missing ..." error, */
+      txt = (s) ? s : sc_value(scan);
+      break;                    /* show the given name if there is one */
+    default:                    /* if normal error message, */
+      txt = sc_value(scan);     /* show the current token value */
+      break;
+  }
+  strncpy(src, txt, sizeof(src)-1);  /* copy with a length bound */
+  src[sizeof(src)-1] = '\0';    /* (strncpy need not terminate) */
+  sc_format(dst, src, 1);       /* format the bounded copy */
+  if      (code == E_CHREXP) return sc_error(scan, code, c, dst);
+  else if (code == E_STREXP) return sc_error(scan, code, s, dst);
+  else                       return sc_error(scan, code,    dst);
+}  /* pa_error() */             /* print an error message */

data/ext/util/src/parse.h ADDED

@@ -0,0 +1,81 @@
+/*----------------------------------------------------------------------
+  File    : parse.h
+  Contents: parser utilities
+  Author  : Christian Borgelt
+  History : 2004.08.12 file created
+            2006.02.02 error E_EDGE   added
+            2007.01.16 error E_MSDCNT added
+----------------------------------------------------------------------*/
+#ifndef __PARSE__
+#define __PARSE__
+#ifndef SC_SCAN
+#define SC_SCAN
+#endif
+#include "scan.h"
+/*----------------------------------------------------------------------
+  Preprocessor Definitions
+----------------------------------------------------------------------*/
+/* --- error codes ---
+  Parser error codes. The message texts for these codes are in the
+  errmsgs tables of parse.c, which list them in the same order. */
+#define E_CHREXP    (-16)       /* character expected */
+#define E_STREXP    (-17)       /* string expected */
+#define E_NUMEXP    (-18)       /* number expected */
+#define E_NUMBER    (-19)       /* invalid number */
+#define E_ATTEXP    (-20)       /* attribute expected */
+#define E_UNKATT    (-21)       /* unknown attribute */
+#define E_DUPATT    (-22)       /* duplicate attribute */
+#define E_MISATT    (-23)       /* missing attribute */
+#define E_ATTRIB    (-24)       /* invalid attribute */
+#define E_ATTYPE    (-25)       /* wrong attribute type */
+#define E_VALEXP    (-26)       /* attribute value expected */
+#define E_UNKVAL    (-27)       /* unknown attribute value */
+#define E_DUPVAL    (-28)       /* duplicate attribute value */
+#define E_MISVAL    (-29)       /* missing attribute value */
+#define E_CLSEXP    (-30)       /* class value expected */
+#define E_UNKCLS    (-31)       /* unknown class value */
+#define E_DUPCLS    (-32)       /* duplicate class value */
+#define E_MISCLS    (-33)       /* missing class value */
+#define E_CLSTYPE   (-34)       /* class attribute must be nominal */
+#define E_CLSCNT    (-35)       /* class attribute has too few values */
+#define E_DOMAIN    (-36)       /* invalid attribute domain */
+#define E_PAREXP    (-37)       /* parameter expected */
+#define E_CMPOP     (-38)       /* invalid comparison operator */
+#define E_COVMAT    (-39)       /* invalid covariance matrix */
+#define E_DUPCDL    (-40)       /* duplicate candidate list */
+#define E_RANGE     (-41)       /* invalid candidate range */
+#define E_CAND      (-42)       /* invalid candidate */
+#define E_LINK      (-43)       /* invalid link */
+#define E_LYRCNT    (-44)       /* invalid number of layers */
+#define E_UNITCNT   (-45)       /* invalid number of units */
+#define E_EDGE      (-46)       /* invalid edge type */
+#define E_MSDCNT    (-47)       /* wrong number of membership degrees */
+/*----------------------------------------------------------------------
+  Functions
+----------------------------------------------------------------------*/
+extern void pa_init  (SCAN *scan);   /* passes the parser's error
+                                        message table to scan */
+extern int  pa_error (SCAN *scan, int code, int c, const char *s);
+                                /* reports error 'code' via sc_error
+                                   and returns its result; c is the
+                                   expected character (E_CHREXP),
+                                   s the expected string (E_STREXP)
+                                   or the name to show for duplicate
+                                   and missing items and E_CAND */
+/*----------------------------------------------------------------------
+  Preprocessor Definitions
+----------------------------------------------------------------------*/
+#define ERROR(c)    return pa_error(scan, c,        -1, NULL)
+#define XERROR(c,s) return pa_error(scan, c,        -1, s)
+#define ERR_CHR(c)  return pa_error(scan, E_CHREXP,  c, NULL)
+#define ERR_STR(s)  return pa_error(scan, E_STREXP, -1, s)
+#define GET_TOK()   if (sc_next(scan) < 0) \
+                      return sc_error(scan, sc_token(scan))
+#define GET_CHR(c)  if (sc_token(scan) != (c)) ERR_CHR(c); \
+                      else GET_TOK()
+#define RECOVER()   if (sc_recover(scan, ';', '{', '}', 0) == T_EOF) \
+                      return 1
+#endif

data/ext/util/src/scan.c ADDED

@@ -0,0 +1,767 @@
+/*----------------------------------------------------------------------
+  File    : scan.c
+  Contents: scanner (lexical analysis of a character stream)
+  Author  : Christian Borgelt
+  History : 1996.01.16 file created
+            1996.02.21 identifier recognition made more flexible
+            1996.03.17 keyword tokens removed
+            1996.04.15 duplicate state removed from sc_next
+            1997.07.29 < and > declared active (for decision trees)
+            1997.09.08 escape sequences in strings made possible
+            1997.09.11 single characters stored also in scn->value
+            1998.02.08 recover and error message functions added
+            1998.02.09 bug in state S_NUMPT concerning "-." removed
+            1998.02.13 token T_RGT ('->') added
+            1998.03.04 returned tokens changed for some states
+            1998.04.17 token T_LFT ('<-') added
+            1998.05.27 token T_CMP (two char comparison operator) added
+            1998.05.31 token conversion to number removed
+            1999.02.08 reading from standard input made possible
+            1999.04.29 quoted string parsing improved
+            1999.11.13 token string length stored in scn->len
+            2000.11.23 functions sc_fmtlen and sc_format added
+            2001.07.15 scanner made an object, state definitions added
+            2001.07.16 characters with code > 127 made printable
+                       look ahead functionality added (sc_back)
+            2006.02.02 token T_DASH (undirected edge '--') added
+----------------------------------------------------------------------*/
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <stdarg.h>
+#include <assert.h>
+#include "scan.h"
+#ifdef STORAGE
+#include "storage.h"
+#endif
+/*----------------------------------------------------------------------
+  Preprocessor Definitions
+----------------------------------------------------------------------*/
+#ifdef SC_SCAN
+/* --- character classes ---
+  These are the values stored in the table _ccltab of this file,
+  which assigns one class to every character code. */
+#define C_INVALID    0          /* invalid character */
+#define C_SPACE      1          /* white space, e.g. ' ' '\t' '\n' */
+#define C_LETTER     2          /* letter or underscore '_' */
+#define C_DIGIT      3          /* digit */
+#define C_POINT      4          /* point, '.' */
+#define C_SIGN       5          /* sign,  '+' or '-' */
+#define C_SLASH      6          /* slash, '/' */
+#define C_QUOTE      7          /* quote, e.g. '"' '`' */
+#define C_CMPOP      8          /* comparison operator, e.g. '<' */
+#define C_ACTIVE     9          /* active characters, e.g. ',' '(' */
+/* --- scanner states --- */
+#define S_SPACE      0          /* skipping white space */
+#define S_ID         1          /* reading identifier */
+#define S_NUMDIG     2          /* reading number, digit */
+#define S_NUMPT      3          /* reading number, decimal point */
+#define S_FRAC       4          /* reading number, digit and point */
+#define S_EXPIND     5          /* reading exponent, indicator */
+#define S_EXPSGN     6          /* reading exponent, sign */
+#define S_EXPDIG     7          /* reading exponent, digit */
+#define S_SIGN       8          /* sign read */
+#define S_CMPOP      9          /* reading comparison operator */
+#define S_STRING    10          /* reading quoted string */
+#define S_ESC       11          /* reading escaped character */
+#define S_OCT1      12          /* reading octal  number, 1 digit */
+#define S_OCT2      13          /* reading octal  number, 2 digits */
+#define S_HEX1      14          /* reading hexad. number, 1 digit */
+#define S_HEX2      15          /* reading hexad. number, 2 digits */
+#define S_SLASH     16          /* slash read */
+#define S_CPPCOM    17          /* reading C++ comment */
+#define S_CCOM1     18          /* reading C comment */
+#define S_CCOM2     19          /* reading C comment, possible end */
+#define S_CCOM3     20          /* reading C comment, possible start */
+/* --- functions ---
+  UNGETC(s,c) pushes character c back onto the file of scanner s.
+  It does nothing if c is EOF and decrements the line counter of s
+  if c is a newline. Both arguments are evaluated more than once,
+  so they must be free of side effects. */
+#define UNGETC(s,c)  do { if ((c) ==  EOF) break; \
+                          if ((c) == '\n') (s)->line--; \
+                          ungetc(c, (s)->file); } while (0)
+/* --- additional error codes --- */
+#define E_UNKNOWN   (-11)       /* unknown error */
+#define MSGOFFSET   (-16)       /* offset for add. error messages
+                                   (equal to E_CHREXP, the first
+                                   parser error code in parse.h) */
+/* --- texts --- */
+#ifdef GERMAN                   /* German texts */
+#define FILETXT     "Datei"
+#define LINETXT     "Zeile"
+#else                           /* English texts */
+#define FILETXT     "file"
+#define LINETXT     "line"
+#endif  /* #ifdef GERMAN .. #else .. */
+#endif  /* #ifdef SC_SCAN */
+/*----------------------------------------------------------------------
+  Constants
+----------------------------------------------------------------------*/
+static const char _scftab[256] = {  /* scanable form classes:
+  one entry per character code 0x00-0xff; the row labels give the
+  code of the first entry of each pair of rows. An entry is 0, 1,
+  2 or a character. The character entries are the letters of the
+  C escape sequences of the respective codes (e.g. 'n' for LF) and
+  the quote and backslash themselves.
+  NOTE(review): presumably 0 marks characters that may be written
+  unquoted, 1 characters that need a quoted string and 2 characters
+  that need a numeric escape - confirm against sc_fmtlen/sc_format,
+  which are not part of this excerpt. */
+        /* NUL  SOH  STX  ETX  EOT  ENQ  ACK  BEL */
+/* 00 */    2,   2,   2,   2,   2,   2,   2,  'a',
+        /*  BS   HT   LF   VT   FF   CR   SO   SI */
+           'b', 't', 'n', 'v', 'f', 'r',  2,   2,
+        /* DLE  DC1  DC2  DC3  DC4  NAK  SYN  ETB */
+/* 10 */    2,   2,   2,   2,   2,   2,   2,   2,
+        /* CAN   EM  SUB  ESC   FS   GS   RS   US */
+            2,   2,   2,   2,   2,   2,   2,   2,
+        /* ' '  '!'  '"'  '#'  '$'  '%'  '&'  ''' */
+/* 20 */    1,   1,  '"',  1,   1,   1,   1,   1,
+        /* '('  ')'  '*'  '+'  ','  '-'  '.'  '/' */
+            1,   1,   1,   0,   1,   0,   0,   1,
+        /* '0'  '1'  '2'  '3'  '4'  '5'  '6'  '7' */
+/* 30 */    0,   0,   0,   0,   0,   0,   0,   0,
+        /* '8'  '9'  ':'  ';'  '<'  '='  '>'  '?' */
+            0,   0,   1,   1,   1,   1,   1,   1,
+        /* '@'  'A'  'B'  'C'  'D'  'E'  'F'  'G' */
+/* 40 */    1,   0,   0,   0,   0,   0,   0,   0,
+        /* 'H'  'I'  'J'  'K'  'L'  'M'  'N'  'O' */
+            0,   0,   0,   0,   0,   0,   0,   0,
+        /* 'P'  'Q'  'R'  'S'  'T'  'U'  'V'  'W' */
+/* 50 */    0,   0,   0,   0,   0,   0,   0,   0,
+        /* 'X'  'Y'  'Z'  '['  '\'  ']'  '^'  '_' */
+            0,   0,   0,   1, '\\',  1,   1,   0,
+        /* '`'  'a'  'b'  'c'  'd'  'e'  'f'  'g' */
+/* 60 */    1,   0,   0,   0,   0,   0,   0,   0,
+        /* 'h'  'i'  'j'  'k'  'l'  'm'  'n'  'o' */
+            0,   0,   0,   0,   0,   0,   0,   0,
+        /* 'p'  'q'  'r'  's'  't'  'u'  'v'  'w' */
+/* 70 */    0,   0,   0,   0,   0,   0,   0,   0,
+        /* 'x'  'y'  'z'  '{'  '|'  '}'  '~'  DEL */
+            0,   0,   0,   1,   1,   1,   1,   2,
+/* 80 */    1,   1,   1,   1,   1,   1,   1,   1,
+            1,   1,   1,   1,   1,   1,   1,   1,
+/* 90 */    1,   1,   1,   1,   1,   1,   1,   1,
+            1,   1,   1,   1,   1,   1,   1,   1,
+/* a0 */    1,   1,   1,   1,   1,   1,   1,   1,
+            1,   1,   1,   1,   1,   1,   1,   1,
+/* b0 */    1,   1,   1,   1,   1,   1,   1,   1,
+            1,   1,   1,   1,   1,   1,   1,   1,
+/* c0 */    1,   1,   1,   1,   1,   1,   1,   1,
+            1,   1,   1,   1,   1,   1,   1,   1,
+/* d0 */    1,   1,   1,   1,   1,   1,   1,   1,
+            1,   1,   1,   1,   1,   1,   1,   1,
+/* e0 */    1,   1,   1,   1,   1,   1,   1,   1,
+            1,   1,   1,   1,   1,   1,   1,   1,
+/* f0 */    1,   1,   1,   1,   1,   1,   1,   1,
+            1,   1,   1,   1,   1,   1,   1,   1 };
+#ifdef SC_SCAN
+static const char _ccltab[256] = {  /* character classes:
+  one entry per character code 0x00-0xff; the row labels give the
+  code of the first entry of each pair of rows. The values are the
+  C_... character class constants defined in this file
+  (0 = C_INVALID, 1 = C_SPACE, 2 = C_LETTER, 3 = C_DIGIT,
+  4 = C_POINT, 5 = C_SIGN, 6 = C_SLASH, 7 = C_QUOTE, 8 = C_CMPOP,
+  9 = C_ACTIVE). All codes from 0x80 on are classed as invalid. */
+        /* NUL  SOH  STX  ETX  EOT  ENQ  ACK  BEL */
+/* 00 */    0,   0,   0,   0,   0,   0,   0,   0,
+        /*  BS   HT   LF   VT   FF   CR   SO   SI */
+            0,   1,   1,   1,   1,   1,   0,   0,
+        /* DLE  DC1  DC2  DC3  DC4  NAK  SYN  ETB */
+/* 10 */    0,   0,   0,   0,   0,   0,   0,   0,
+        /* CAN   EM  SUB  ESC   FS   GS   RS   US */
+            0,   0,   0,   0,   0,   0,   0,   0,
+        /* ' '  '!'  '"'  '#'  '$'  '%'  '&'  ''' */
+/* 20 */    1,   8,   7,   9,   9,   9,   9,   7,
+        /* '('  ')'  '*'  '+'  ','  '-'  '.'  '/' */
+            9,   9,   9,   5,   9,   5,   4,   6,
+        /* '0'  '1'  '2'  '3'  '4'  '5'  '6'  '7' */
+/* 30 */    3,   3,   3,   3,   3,   3,   3,   3,
+        /* '8'  '9'  ':'  ';'  '<'  '='  '>'  '?' */
+            3,   3,   9,   9,   8,   8,   8,   9,
+        /* '@'  'A'  'B'  'C'  'D'  'E'  'F'  'G' */
+/* 40 */    0,   2,   2,   2,   2,   2,   2,   2,
+        /* 'H'  'I'  'J'  'K'  'L'  'M'  'N'  'O' */
+            2,   2,   2,   2,   2,   2,   2,   2,
+        /* 'P'  'Q'  'R'  'S'  'T'  'U'  'V'  'W' */
+/* 50 */    2,   2,   2,   2,   2,   2,   2,   2,
+        /* 'X'  'Y'  'Z'  '['  '\'  ']'  '^'  '_' */
+            2,   2,   2,   9,   9,   9,   9,   2,
+        /* '`'  'a'  'b'  'c'  'd'  'e'  'f'  'g' */
+/* 60 */    7,   2,   2,   2,   2,   2,   2,   2,
+        /* 'h'  'i'  'j'  'k'  'l'  'm'  'n'  'o' */
+            2,   2,   2,   2,   2,   2,   2,   2,
+        /* 'p'  'q'  'r'  's'  't'  'u'  'v'  'w' */
+/* 70 */    2,   2,   2,   2,   2,   2,   2,   2,
+        /* 'x'  'y'  'z'  '{'  '|'  '}'  '~'  DEL */
+            2,   2,   2,   9,   9,   9,   9,   0,
+/* 80 */    0,   0,   0,   0,   0,   0,   0,   0,
+            0,   0,   0,   0,   0,   0,   0,   0,
+/* 90 */    0,   0,   0,   0,   0,   0,   0,   0,
+            0,   0,   0,   0,   0,   0,   0,   0,
+/* a0 */    0,   0,   0,   0,   0,   0,   0,   0,
+            0,   0,   0,   0,   0,   0,   0,   0,
+/* b0 */    0,   0,   0,   0,   0,   0,   0,   0,
+            0,   0,   0,   0,   0,   0,   0,   0,
+/* c0 */    0,   0,   0,   0,   0,   0,   0,   0,
+            0,   0,   0,   0,   0,   0,   0,   0,
+/* d0 */    0,   0,   0,   0,   0,   0,   0,   0,
+            0,   0,   0,   0,   0,   0,   0,   0,
+/* e0 */    0,   0,   0,   0,   0,   0,   0,   0,
+            0,   0,   0,   0,   0,   0,   0,   0,
+/* f0 */    0,   0,   0,   0,   0,   0,   0,   0,
+            0,   0,   0,   0,   0,   0,   0,   0 };
+#ifdef GERMAN                      /* deutsche Texte */
+static const char *_errmsgs[] = {  /* error messages */
+  /* E_NONE      0 */  "kein Fehler",
+  /* E_NOMEM    -1 */  "nicht genug Speicher",
+  /* E_FOPEN    -2 */  "�ffnen fehlgeschlagen",
+  /* E_FREAD    -3 */  "Lesefehler",
+  /* E_FWRITE   -4 */  "Schreibfehler",
+  /* E_CHAR     -5 */  "ung�ltiges Zeichen '%c' (0x%02x)",
+  /* E_BUFOVF   -6 */  "Puffer�berlauf",
+  /* E_UNTSTR   -7 */  "unbeendete Zeichenkette",
+  /* E_UNTCOM   -8 */  "unerwartetes Dateiende in Kommentar "
+                       "(Anfang in Zeile %d)",
+  /* E_STATE    -9 */  "ung�ltiger Scannerzustand",
+  /* E_GARBAGE -10 */  "ung�ltiger Text am Dateiende",
+  /* E_UNKNOWN -11 */  "unbekannter Fehler"
+};
+#else                              /* English texts */
+static const char *_errmsgs[] = {  /* built-in error messages, indexed
+                                      by the negated error code
+                                      (sc_error() reads _errmsgs[-code]),
+                                      so the order must follow the
+                                      E_... codes noted below */
+  /* E_NONE      0 */  "no error",
+  /* E_NOMEM    -1 */  "not enough memory",
+  /* E_FOPEN    -2 */  "file open failed",
+  /* E_FREAD    -3 */  "file read failed",
+  /* E_FWRITE   -4 */  "file write failed",
+  /* E_CHAR     -5 */  "invalid character '%c' (0x%02x)",
+                       /* format: printable character, character code */
+  /* E_BUFOVF   -6 */  "scan buffer overflow",
+  /* E_UNTSTR   -7 */  "unterminated string",
+  /* E_UNTCOM   -8 */  "unexpected end of file in comment "
+                       "started on line %d",
+                       /* format: line on which the comment started */
+  /* E_STATE    -9 */  "invalid scanner state",
+  /* E_GARBAGE -10 */  "garbage at end of file",
+  /* E_UNKNOWN -11 */  "unknown error"
+};
+#endif  /* #ifdef GERMAN .. #else .. */
+#endif  /* #ifdef SC_SCAN */
+/*----------------------------------------------------------------------
+  Auxiliary Functions
+----------------------------------------------------------------------*/
+#ifdef SC_SCAN
+/* Exchange the current and the previous token information: the value
+   pointer is flipped to the other scan buffer and the length, line
+   and token fields are exchanged with their p... counterparts.
+   Returns the token that is current after the exchange. */
+static int _swap (SCAN *scan)
+{                               /* --- swap token information */
+  int held;                     /* value held during an exchange */
+
+  /* the two scan buffers alternate: select the one not in use */
+  scan->value = (scan->value == scan->buf[0])
+              ? scan->buf[1] : scan->buf[0];
+  held = scan->len;             /* exchange the token lengths */
+  scan->len    = scan->plen;
+  scan->plen   = held;
+  held = scan->line;            /* exchange the line numbers */
+  scan->line   = scan->pline;
+  scan->pline  = held;
+  held = scan->token;           /* exchange the tokens themselves */
+  scan->token  = scan->ptoken;
+  scan->ptoken = held;
+  return scan->token;           /* return the new current token */
+}  /* _swap() */
+#endif
+/*----------------------------------------------------------------------
+  Main Functions
+----------------------------------------------------------------------*/
+/* Compute the length a name has in scanable form (cf. sc_format()).
+   s   : name to examine (must not be NULL)
+   len : if not NULL, receives the plain length of the name
+   Returns the plain length plus the characters needed for escape
+   sequences plus 2 for quotes if any character requires them.
+   Note that an empty name yields 0, because the quote flag is only
+   set by characters that are actually seen. */
+int sc_fmtlen (const char *s, int *len)
+{                               /* --- length of a formatted name */
+  const char *p;                /* to traverse the name */
+  int  extra  = 0;              /* additional characters for escapes */
+  int  quoted = 0;              /* whether quotes are needed */
+  int  cls;                     /* class of the current character */
+  int  n;                       /* plain length of the name */
+
+  assert(s);                    /* check the function arguments */
+  for (p = s; *p; p++) {        /* traverse the characters */
+    cls = _scftab[(unsigned char)*p];
+    if (cls == 0) continue;     /* normal characters need nothing */
+    quoted = 1;                 /* all other classes need quotes */
+    if      (cls == 2) extra += 3;   /* '\xhh' adds 3 characters */
+    else if (cls != 1) extra += 1;   /* '\c'   adds 1 character */
+  }                             /* (class 1 needs only the quotes) */
+  n = (int)(p -s);              /* get the plain length and */
+  if (len) *len = n;            /* store it if requested */
+  return n +extra +(quoted ? 2 : 0);
+}  /* sc_fmtlen() */
+/*--------------------------------------------------------------------*/
+/* Write a name in scanable form, i.e. quoted and escaped as needed.
+   dst    : destination buffer (must not be NULL; no bounds check is
+            done here, the caller has to provide enough room)
+   src    : name to format (must not be NULL)
+   quotes : nonzero to always enclose the result in double quotes
+   An empty name and a name containing any character of a class other
+   than 0 are quoted even if quotes is zero.
+   Returns the length of the string written to dst (without the
+   terminating null character). */
+int sc_format (char *dst, const char *src, int quotes)
+{                               /* --- format name in scanable form */
+  static const char hexdig[] = "0123456789abcdef";
+  const char *s;                /* to traverse the name */
+  char *out = dst;              /* to traverse the destination */
+  int  ch, cls;                 /* character and character class */
+
+  assert(dst && src);           /* check the function arguments */
+  if (!*src) quotes = 1;        /* an empty name needs quotes */
+  for (s = src; !quotes && *s; s++)  /* unless quotes are mandatory, */
+    if (_scftab[(unsigned char)*s] != 0)  /* look for a character */
+      quotes = 1;               /* that makes them necessary */
+  if (quotes) *out++ = '"';     /* store the opening quote */
+  for (s = src; *s; s++) {      /* traverse the characters */
+    ch  = (unsigned char)*s;    /* get the next character */
+    cls = _scftab[ch];          /* and its character class */
+    if (cls == 2) {             /* if it has no short escape form, */
+      *out++ = '\\';            /* store its code as '\xhh' */
+      *out++ = 'x';
+      *out++ = hexdig[ch >> 4];
+      *out++ = hexdig[ch & 0xf]; }
+    else if (cls > 2) {         /* if it is an ANSI escape character, */
+      *out++ = '\\';            /* store it as '\c' (the class is */
+      *out++ = cls; }           /* the character to use after '\') */
+    else                        /* if it is a normal character, */
+      *out++ = ch;              /* just store it */
+  }
+  if (quotes) *out++ = '"';     /* store the closing quote */
+  *out = '\0';                  /* and terminate the string */
+  return (int)(out -dst);       /* return the length of the result */
+}  /* sc_format() */
+/*--------------------------------------------------------------------*/
+#ifdef SC_SCAN
+/* Create a scanner for a file.
+   fname : name of the file to scan; NULL or an empty string selects
+           standard input (which is then reported as "<stdin>")
+   Returns the new scanner or NULL if the memory allocation or the
+   opening of the file failed. The scanner must be released with
+   sc_delete(). */
+SCAN* sc_create (const char *fname)
+{                               /* --- create a scanner */
+  const char *fn = fname;       /* buffer for filename */
+  SCAN       *scan;             /* created scanner */
+
+  if (!fn || !*fn) fname = "<stdin>";
+  /* NOTE(review): the size presumably relies on SCAN ending in a name */
+  /* array with room for the terminator - confirm in the declaration */
+  scan = (SCAN*)malloc(sizeof(SCAN) +strlen(fname));
+  if (!scan) return NULL;       /* allocate memory for a scanner */
+  strcpy(scan->fname, fname);   /* and note the file name */
+  if (!fn || !*fn)              /* if no file name is given, */
+    scan->file = stdin;         /* read from standard input */
+  else {                        /* if a  file name is given, */
+    scan->file = fopen(fn,"r"); /* open the file for reading */
+    if (!scan->file) { free(scan); return NULL; }
+  }
+  scan->line    = scan->pline  = 1;  /* initialize the fields; */
+  scan->token   = scan->ptoken = 0;  /* the previous token fields */
+  scan->len     = scan->plen   = 0;  /* are set as well, so that */
+  scan->start   = 0;                 /* sc_back() before the first */
+  scan->value   = scan->buf[0];      /* sc_next() does not swap in */
+  scan->buf[0][0] = '\0';            /* indeterminate values */
+  scan->buf[1][0] = '\0';
+  scan->back    = 0;
+  scan->errfile = stderr;
+  scan->msgcnt  = scan->lncnt = 0;
+  scan->msgs    = NULL;
+  return scan;                  /* return created scanner */
+}  /* sc_create() */
+/*--------------------------------------------------------------------*/
+/* Delete a scanner: the input file is closed unless it is standard
+   input, then the scanner structure itself is released.
+   scan : scanner to delete (must not be NULL) */
+void sc_delete (SCAN *scan)
+{                               /* --- delete a scanner */
+  FILE *in = scan->file;        /* input file of the scanner */
+
+  if (in != stdin)              /* standard input is not owned by */
+    fclose(in);                 /* the scanner, so it stays open */
+  free(scan);                   /* delete the scanner structure */
+}  /* sc_delete() */
+/*--------------------------------------------------------------------*/
+/*----------------------------------------------------------------------
+  sc_next: read the next token from the input file of a scanner.
+
+  If sc_back() has been called before, no input is read; the token
+  information is merely swapped back. Otherwise the information about
+  the current token is saved as the previous token, the other scan
+  buffer is selected and a finite state automaton is run over the
+  characters read until a token is complete.
+
+  The token is stored in scan->token and returned. It is one of
+  T_ID, T_NUM, T_DASH ("--"), T_RGT ("->"), T_LFT ("<-"), T_CMP
+  (comparison operator followed by '='), T_EOF, the character itself
+  (for characters of class C_ACTIVE, for '/' and for a comparison
+  operator standing alone) or a negative error code (E_FREAD, E_CHAR,
+  E_BUFOVF, E_UNTSTR, E_UNTCOM, E_STATE). The token text is stored in
+  scan->value and its length in scan->len, except for E_BUFOVF,
+  E_UNTSTR, E_UNTCOM and E_STATE, for which the buffer is left
+  unterminated and scan->len is not updated.
+
+  White space and comments (C++ style and nested C style) are skipped.
+----------------------------------------------------------------------*/
+int sc_next (SCAN *scan)
+{                               /* --- get next token */
+  int  c, ccl;                  /* character and character class */
+  int  quote = 0;               /* quote at the start of a string */
+  int  ec    = 0;               /* escaped character */
+  int  state = 0;               /* state of automaton */
+  int  level = 0;               /* comment nesting level */
+  char *p;                      /* to traverse the scan buffer */
+  char *end;                    /* end of the scan buffer */
+
+  if (scan->back) {             /* if a step backwards has been made, */
+    scan->back = 0;             /* clear the corresponding flag, */
+    return _swap(scan);         /* swap back the token information, */
+  }                             /* and return the current token */
+  scan->pline  = scan->line;    /* note the relevant information */
+  scan->ptoken = scan->token;   /* of the current token */
+  scan->plen   = scan->len;     /* and swap scan buffers */
+  if (scan->value == scan->buf[0]) scan->value = p = scan->buf[1];
+  else                             scan->value = p = scan->buf[0];
+  end = p +SC_BUFSIZE -1;       /* get the end of the scan buffer */
+                                /* (leaves room for the terminator) */
+  while (1) {                   /* read loop */
+    c   = getc(scan->file);     /* get character and character class */
+    ccl = (c < 0) ? EOF : _ccltab[c];
+    if (c == '\n') scan->line++; /* count the line */
+    switch (state) {            /* evaluate state of automaton */
+
+      case S_SPACE:             /* --- skip white space */
+        switch (ccl) {          /* evaluate character category */
+          case C_SPACE : /* do nothing */             break;
+          case C_LETTER: *p++  = c; state = S_ID;     break;
+          case C_DIGIT : *p++  = c; state = S_NUMDIG; break;
+          case C_POINT : *p++  = c; state = S_NUMPT;  break;
+          case C_SIGN  : *p++  = c; state = S_SIGN;   break;
+          case C_CMPOP : *p++  = c; state = S_CMPOP;  break;
+          case C_QUOTE : quote = c; state = S_STRING; break;
+          case C_SLASH :            state = S_SLASH;  break;
+          case C_ACTIVE: *p++  = c; *p = '\0'; scan->len = 1;
+                         return scan->token = c;
+          case EOF     : strcpy(p, "<eof>");   scan->len = 5;
+                         /* (length of the text "<eof>") */
+                         return scan->token = (ferror(scan->file))
+                                           ? E_FREAD : T_EOF;
+          default      : *p++  = c; *p = '\0'; scan->len = 1;
+                         return scan->token = E_CHAR;
+        } break;
+
+      case S_ID:                /* --- identifier (letter read) */
+        if ((ccl == C_LETTER)   /* if another letter */
+        ||  (ccl == C_DIGIT)    /* or a digit */
+        ||  (ccl == C_POINT)    /* or a decimal point */
+        ||  (ccl == C_SIGN)) {  /* or a sign follows */
+          if (p >= end) return scan->token = E_BUFOVF;
+          *p++ = c; break;      /* buffer character */
+        }                       /* otherwise */
+        UNGETC(scan, c);        /* put back last character, */
+        *p = '\0';              /* terminate string in buffer */
+        scan->len = (int)(p -scan->value); /* set string length */
+        return scan->token = T_ID;   /* and return 'identifier' */
+
+      /* In the number states the character is buffered before it */
+      /* is examined; if it ends the token, it is removed again   */
+      /* by the '*--p = 0' that terminates the string.            */
+
+      case S_NUMDIG:            /* --- number (digit read) */
+        if (p < end) *p++ = c;  /* buffer character */
+        else return scan->token = E_BUFOVF;
+        if  (ccl == C_DIGIT)    /* if another digit follows, */
+          break;                /* do nothing */
+        if  (ccl == C_POINT) {  /* if a decimal point follows, */
+          state = S_FRAC;   break; } /* go to 'fraction' state */
+        if ((c == 'e')          /* if an exponent indicator follows */
+        ||  (c == 'E')) {       /* (lower- or uppercase), */
+          state = S_EXPIND; break; } /* go to 'exponent' state */
+        if ((ccl == C_LETTER)   /* if a letter */
+        ||  (ccl == C_SIGN)) {  /* or a sign follows, */
+          state = S_ID; break;  /* go to 'identifier' state */
+        }                       /* otherwise */
+        UNGETC(scan, c);        /* put back last character, */
+        *--p = '\0';            /* terminate string in buffer */
+        scan->len = (int)(p -scan->value); /* set string length */
+        return scan->token = T_NUM;      /* and return 'number' */
+
+      case S_NUMPT:             /* --- number (point read) */
+        if (p < end) *p++ = c;  /* buffer character */
+        else return scan->token = E_BUFOVF;
+        if  (ccl == C_DIGIT) {       /* if a digit follows, */
+          state = S_FRAC; break; }   /* go to 'fraction' state */
+        if ((ccl == C_LETTER)   /* if a letter */
+        ||  (ccl == C_POINT)    /* or a decimal point */
+        ||  (ccl == C_SIGN)) {  /* or a sign follows */
+          state = S_ID; break;  /* go to 'identifier' state */
+        }                       /* otherwise */
+        UNGETC(scan, c);        /* put back last character, */
+        *--p = '\0';            /* terminate string in buffer */
+        scan->len = (int)(p -scan->value); /* set string length */
+        return scan->token = T_ID;   /* and return 'identifier' */
+
+      case S_FRAC:              /* --- number (digit & point read) */
+        if (p < end) *p++ = c;  /* buffer character */
+        else return scan->token = E_BUFOVF;
+        if  (ccl == C_DIGIT)    /* if another digit follows, */
+          break;                /* do nothing else */
+        if ((c == 'e')          /* if an exponent indicator follows, */
+        ||  (c == 'E')) {       /* (lower- or uppercase), */
+          state = S_EXPIND; break; } /* go to exponent state */
+        if ((ccl == C_LETTER)   /* if a letter */
+        ||  (ccl == C_POINT)    /* or a decimal point */
+        ||  (ccl == C_SIGN)) {  /* or a sign follows, */
+          state = S_ID; break;  /* go to 'identifier' state */
+        }                       /* otherwise */
+        UNGETC(scan, c);        /* put back last character, */
+        *--p = '\0';            /* terminate string in buffer */
+        scan->len = (int)(p -scan->value); /* set string length */
+        return scan->token = T_NUM;      /* and return 'number' */
+
+      case S_EXPIND:            /* --- exponent (indicator read) */
+        if (p < end) *p++ = c;  /* buffer character */
+        else return scan->token = E_BUFOVF;
+        if  (ccl == C_SIGN) {        /* if a sign follows, */
+          state = S_EXPSGN; break; } /* go to 2nd 'exponent' state */
+        if  (ccl == C_DIGIT) {       /* if a digit follows, */
+          state = S_EXPDIG; break; } /* go to 3rd 'exponent' state */
+        if ((ccl == C_LETTER)   /* if a letter */
+        ||  (ccl == C_POINT)) { /* or a decimal point follows */
+          state = S_ID; break;  /* go to 'identifier' state */
+        }                       /* otherwise */
+        UNGETC(scan, c);        /* put back last character, */
+        *--p = '\0';            /* terminate string in buffer */
+        scan->len = (int)(p -scan->value); /* set string length */
+        return scan->token = T_ID;   /* and return 'identifier' */
+
+      case S_EXPSGN:            /* --- exponent (sign read) */
+        if (p < end) *p++ = c;  /* buffer character */
+        else return scan->token = E_BUFOVF;
+        if  (ccl == C_DIGIT) {      /* if a digit follows, */
+          state = S_EXPDIG; break;} /* go to 3rd 'exponent' state */
+        if ((ccl == C_LETTER)   /* if a letter */
+        ||  (ccl == C_POINT)    /* or a decimal point */
+        ||  (ccl == C_SIGN)) {  /* or a sign follows */
+          state = S_ID; break;  /* go to 'identifier' state */
+        }                       /* otherwise */
+        UNGETC(scan, c);        /* put back last character, */
+        *--p = '\0';            /* terminate string in buffer */
+        scan->len = (int)(p -scan->value); /* set string length */
+        return scan->token = T_ID;   /* and return 'identifier' */
+
+      case S_EXPDIG:            /* --- exponent (digit read) */
+        if (p < end) *p++ = c;  /* buffer character */
+        else return scan->token = E_BUFOVF;
+        if  (ccl == C_DIGIT)    /* if another digit follows, */
+          break;                /* do nothing else */
+        if ((ccl == C_LETTER)   /* if a letter */
+        ||  (ccl == C_POINT)    /* or a decimal point */
+        ||  (ccl == C_SIGN)) {  /* or a sign follows, */
+          state = S_ID; break;  /* go to 'identifier' state */
+        }                       /* otherwise */
+        UNGETC(scan, c);        /* put back last character, */
+        *--p = '\0';            /* terminate string in buffer */
+        scan->len = (int)(p -scan->value); /* set string length */
+        return scan->token = T_NUM;      /* and return 'number' */
+
+      case S_SIGN:              /* --- number (sign read) */
+        *p++ = c;               /* buffer character */
+        if  (ccl == C_DIGIT) {       /* if a digit follows, */
+          state = S_NUMDIG; break; } /* go to 'number' state */
+        if  (ccl == C_POINT) {       /* if a decimal point follows, */
+          state = S_NUMPT; break; }  /* go to 'point read' state */
+        if ((c == '-')          /* if a '-' follows and previous */
+        &&  (scan->value[0] == '-')) {  /* char was a minus sign */
+          *p = '\0'; scan->len = 2; return scan->token = T_DASH; }
+        if ((c == '>')          /* if a '>' follows and previous */
+        &&  (scan->value[0] == '-')) {  /* char was a minus sign */
+          *p = '\0'; scan->len = 2; return scan->token = T_RGT; }
+        if ((ccl == C_LETTER)        /* if a letter */
+        ||  (ccl == C_SIGN)) {       /* or a sign follows, */
+          state = S_ID; break; }     /* go to 'identifier' state */
+        UNGETC(scan, c);        /* otherwise put back last character, */
+        *--p = '\0';            /* terminate string in buffer */
+        scan->len = (int)(p -scan->value); /* set string length */
+        return scan->token = T_ID;   /* and return 'identifier' */
+
+      case S_CMPOP:             /* --- comparison operator read */
+        if ((c == '-')          /* if a minus sign follows and */
+        &&  (scan->value[0] == '<')) {  /* prev. char was a '<' */
+          *p++ = '-';       scan->token = T_LFT; }
+        else if (c == '=') {    /* if an equal sign follows */
+          *p++ = '=';       scan->token = T_CMP; }
+        else {                  /* if anything else follows, */
+          UNGETC(scan, c);  scan->token = scan->value[0]; }
+        *p = '\0';              /* the operator itself is the token */
+        scan->len = (int)(p -scan->value); /* set string length */
+        return scan->token;        /* and return the token read */
+
+      case S_STRING:            /* --- quoted string */
+        if ((c == '\n') || (c == EOF))  /* if end of line or file, */
+          return scan->token = E_UNTSTR;   /* string is unterminated */
+        if (c != quote) {       /* if not at end of string */
+          if (p >= end) return scan->token = E_BUFOVF;
+          if (c == '\\') {      /* if escaped character follows, */
+            state = S_ESC; break; }  /* go to escaped char state */
+          *p++ = c; break;      /* otherwise buffer character */
+        }                       /* if at end of string, */
+        *p = '\0';              /* terminate string in buffer */
+        scan->len = (int)(p -scan->value); /* set string length */
+        return scan->token = T_ID;   /* and return 'identifier' */
+
+      /* All escape states store at most one character. The room */
+      /* for it has been checked in state S_STRING before the    */
+      /* backslash was accepted.                                 */
+
+      case S_ESC:               /* --- after '\' in quoted string */
+        if ((c >= '0') && (c <= '7')) {        /* if octal digit, */
+          ec = c -'0'; state = S_OCT1; break; }/* evaluate digit  */
+        if (c == 'x') {         /* if hexadecimal character code, */
+          state = S_HEX1; break;} /* go to hexadecimal evaluation */
+        switch (c) {            /* evaluate character after '\' */
+          case  'a': c = '\a'; break;
+          case  'b': c = '\b'; break;
+          case  'f': c = '\f'; break;
+          case  'n': c = '\n'; break;
+          case  'r': c = '\r'; break;
+          case  't': c = '\t'; break;
+          case  'v': c = '\v'; break;
+          case '\n': c = -1;   break;  /* line continuation */
+          default  :           break;  /* character stands for itself */
+        }                       /* get escaped character */
+        if (c >= 0) *p++ = c;   /* and store it, then */
+        state = S_STRING; break;/* return to quoted string state */
+
+      case S_OCT1:              /* --- escaped octal number 1 */
+        if ((c >= '0')          /* if an octal digit follows, */
+        &&  (c <= '7')) {       /* evaluate it */
+          ec = ec *8 +c -'0'; state = S_OCT2; break; }
+        UNGETC(scan, c);        /* otherwise put back last character */
+        *p++  = ec;             /* store escaped character and */
+        state = S_STRING; break;/* return to quoted string state */
+
+      case S_OCT2:              /* --- escaped octal number 2 */
+        if ((c >= '0') && (c <= '7'))  /* (both bounds must hold) */
+          ec = ec *8 +c -'0';   /* if octal digit, evaluate it */
+        else UNGETC(scan, c);   /* otherwise put back last character */
+        *p++  = ec;             /* store escaped character and */
+        state = S_STRING; break;/* return to quoted string state */
+
+      case S_HEX1:              /* --- escaped hexadecimal number 1 */
+        if (ccl == C_DIGIT) {   /* if hexadecimal digit, evaluate it */
+          ec = c -'0';     state = S_HEX2; break; }
+        if ((c >= 'a') && (c <= 'f')) {
+          ec = c -'a' +10; state = S_HEX2; break; }
+        if ((c >= 'A') && (c <= 'F')) {
+          ec = c -'A' +10; state = S_HEX2; break; }
+        UNGETC(scan, c);        /* otherwise put back last character */
+        *p++  = 'x';            /* store escaped character ('x') and */
+        state = S_STRING; break;/* return to quoted string state */
+
+      case S_HEX2:              /* --- escaped hexadecimal number 2 */
+        if (ccl == C_DIGIT)     /* if hexadecimal digit, evaluate it */
+          ec = ec*16 +c -'0';
+        else if ((c >= 'a') && (c <= 'f'))
+          ec = ec*16 +c -'a' +10;
+        else if ((c >= 'A') && (c <= 'F'))
+          ec = ec*16 +c -'A' +10;
+        else UNGETC(scan, c);   /* otherwise put back last character */
+        *p++  = ec;             /* store escaped character and */
+        state = S_STRING; break;/* return to quoted string state */
+
+      case S_SLASH:             /* --- slash '/' */
+        if (c == '/') {         /* if C++ style comment, then */
+          state = S_CPPCOM; break; }   /* skip to end of line */
+        if (c == '*') {         /* if C style comment */
+          scan->start = scan->line; level = 1;
+          state = S_CCOM1; break;    /* note start line, init. level */
+        }                       /* and go to first 'comment' state */
+        UNGETC(scan, c);        /* otherwise put back last character */
+        *p++ = '/'; *p = '\0';  /* store character in buffer */
+        scan->len = 1;          /* set string length and */
+        return scan->token = '/';  /* return `character' */
+
+      case S_CPPCOM:            /* --- C++ style comment */
+        if ((c == '\n')         /* if at end of line */
+        ||  (c == EOF))         /* or at end of file */
+          state = S_SPACE;      /* return to white space skipping */
+        break;                  /* (skip to end of line) */
+
+      case S_CCOM1:             /* --- C style comment 1 */
+        if      (c == EOF)      /* if end of file, abort */
+          return scan->token = E_UNTCOM;
+        if      (c == '*')      /* if possibly 'end of comment', */
+          state = S_CCOM2;      /* go to 2nd 'comment' state */
+        else if (c == '/')      /* if possibly 'start of comment', */
+          state = S_CCOM3;      /* go to 3rd 'comment' state */
+        break;
+
+      case S_CCOM2:             /* --- C style comment 2 ('*' read) */
+        if      (c == EOF)      /* if end of file, abort */
+          return scan->token = E_UNTCOM;
+        if      (c == '/') {    /* if end of comment found, */
+          if (--level <= 0) state = S_SPACE;  /* leave one level */
+          else              state = S_CCOM1; }
+        else if (c != '*')      /* if end of comment impossible */
+          state = S_CCOM1;      /* return to comment skipping */
+        break;                  /* (another '*' keeps the state) */
+
+      case S_CCOM3:             /* --- C style comment 3 ('/' read) */
+        if      (c == EOF)      /* if end of file, abort */
+          return scan->token = E_UNTCOM;
+        if      (c == '*') {    /* if start of comment found, */
+          level++; state = S_CCOM1; }         /* enter a new level */
+        else if (c != '/')      /* if start of comment impossible */
+          state = S_CCOM1;      /* return to comment skipping */
+        break;                  /* (another '/' keeps the state) */
+
+      default:                  /* if state is invalid, abort */
+        return scan->token = E_STATE;
+    }  /* switch() */
+  }  /* while(1) */
+}  /* sc_next() */
+/*--------------------------------------------------------------------*/
+int sc_nexter (SCAN *scan)
+{                               /* --- get next token error reporting */
+  if (sc_next(scan) < 0) return sc_error(scan, scan->token);
+  return scan->token;           /* get next token, report error, */
+}  /* sc_nexter() */            /* and return next token */
+/*--------------------------------------------------------------------*/
+/* Go back one token. Only a single step backwards is possible; if
+   one has already been made, nothing is changed.
+   Returns the token that is current afterwards. */
+int sc_back (SCAN *scan)
+{                               /* --- go back one token */
+  if (!scan->back) {            /* if no step back has been made yet, */
+    scan->back = -1;            /* set the step backward flag, */
+    return _swap(scan);         /* swap the token information, */
+  }                             /* and return the previous token */
+  return scan->token;           /* a second step is impossible */
+}  /* sc_back() */
+/*--------------------------------------------------------------------*/
+/* Check whether the end of the file has been reached.
+   Returns 1 if the current token is T_EOF; otherwise the error
+   E_GARBAGE is reported and 0 is returned. */
+int sc_eof (SCAN *scan)
+{                               /* --- check for end of file */
+  if (scan->token != T_EOF) {   /* if the end is not reached, */
+    sc_error(scan, E_GARBAGE);  /* report the remaining text */
+    return 0;                   /* as an error */
+  }
+  return 1;                     /* otherwise signal 'end of file' */
+}  /* sc_eof() */
+/*--------------------------------------------------------------------*/
+int sc_recover (SCAN *scan, int stop, int beg, int end, int level)
+{                               /* --- recover from an error */
+  while ((scan->token != stop)     /* while at stop token */
+  &&     (scan->token != T_EOF)) { /* and not at end of file */
+    if       (scan->token == beg)  /* if begin level token found, */
+      level++;                     /* increment level counter */
+    else if ((scan->token == end)  /* if end level token found */
+    &&       (--level    <= 0))    /* and on level to return to, */
+      break;                       /* abort loop */
+    if (sc_next(scan) < 0) return scan->token;
+  }                             /* consume token */
+  if (scan->token != T_EOF)     /* if not at end of file, */
+    sc_next(scan);              /* consume token (stop or end) */
+  return scan->token;           /* return the next token */
+}  /* sc_recover() */
+/*--------------------------------------------------------------------*/
+void sc_errfile (SCAN *scan, FILE *file, int lncnt)
+{                               /* --- set file for error output */
+  assert(scan);                 /* check the function arguments */
+  scan->errfile = (file) ? file : stderr;
+  scan->lncnt   = lncnt;        /* set file and line count */
+}  /* sc_errfile() */
+/*--------------------------------------------------------------------*/
+void sc_errmsgs (SCAN *scan, const char *msgs[], int cnt)
+{                                /* --- set additonal error messages */
+  assert(scan);                  /* check the function arguments */
+  scan->msgs   = msgs;           /* note error message vector */
+  scan->msgcnt = cnt;            /* and number of error messages */
+}  /* sc_errmsgs() */
+/*--------------------------------------------------------------------*/
+/*----------------------------------------------------------------------
+  sc_error: print an error message to the error output file.
+
+  code : error code; non-negative values are treated as E_NONE
+  ...  : arguments for the format of the message (not used for the
+         codes E_CHAR and E_UNTCOM, which take their arguments from
+         the scanner)
+
+  The message starts with the file name and, except for E_NONE,
+  E_FOPEN and E_UNTCOM, the current line number. Codes greater than
+  E_UNKNOWN select a built-in message, other codes select the message
+  with index MSGOFFSET -code in the vector set with sc_errmsgs().
+  If no message text can be found, E_UNKNOWN is reported instead.
+
+  The line count set with sc_errfile() controls the layout:
+    <= 0 : a newline is printed before the message
+    >  0 : a newline is printed after  the message
+    >  1 : the message text starts on a new line
+    >  2 : the line number  starts on a new line
+
+  Returns the error code that was actually reported.
+----------------------------------------------------------------------*/
+int sc_error (SCAN *scan, int code, ...)
+{                               /* --- print an error message */
+  va_list    args;              /* variable argument list */
+  const char *msg;              /* error message */
+  int        c, pc;             /* the invalid character */
+  int        tmp;               /* index of an additional message */
+
+  assert(scan);                 /* check the function arguments */
+  if (scan->lncnt <= 0)         /* if line count is zero or negative, */
+    putc('\n', scan->errfile);  /* start a new output line */
+  fprintf(scan->errfile, FILETXT" %s", scan->fname);
+                                /* print the file name */
+  if ((code != E_NONE)          /* if an error occurred, */
+  &&  (code != E_FOPEN)         /* but not 'file open failed' */
+  &&  (code != E_UNTCOM)) {     /* and not 'unterminated comment' */
+    fputs((scan->lncnt > 2) ? ",\n" : ", ", scan->errfile);
+    fprintf(scan->errfile, LINETXT" %d", scan->line);
+  }                             /* print line number */
+  fputs((scan->lncnt > 1) ? ":\n" : ": ", scan->errfile);
+  if (code >= 0) code = E_NONE; /* check error code and */
+  tmp = MSGOFFSET -code;        /* get error message text */
+  if      (code > E_UNKNOWN)    /* built-in messages */
+    msg = _errmsgs[-code];
+  else if (scan->msgs           /* additional messages: tmp is */
+  &&      (tmp >= 0)            /* negative if code > MSGOFFSET, */
+  &&      (tmp <  scan->msgcnt))/* which must not be used as index */
+    msg = scan->msgs[tmp];
+  else                          /* if the code is out of range, */
+    msg = NULL;                 /* there is no message text */
+  if (!msg) msg = _errmsgs[-(code = E_UNKNOWN)];
+  switch (code) {               /* special error handling */
+    case E_CHAR  : c = pc = (unsigned char)scan->value[0];
+                   if (c < ' ') pc = ' ';  /* hide control characters */
+                   fprintf (scan->errfile, msg, pc, c);       break;
+    case E_UNTCOM: fprintf (scan->errfile, msg, scan->start); break;
+    default      : va_start(args, code); /* get variable arguments */
+                   vfprintf(scan->errfile, msg, args);
+                   va_end(args); break;  /* print error message and */
+  }                             /* end variable argument evaluation */
+  if (scan->lncnt > 0)          /* if line count is positive, */
+    putc('\n', scan->errfile);  /* terminate output line */
+  return code;                  /* return error code */
+}  /* sc_error() */
+#endif