Mercurial > ~dholland > hg > ag > index.cgi

diff examples/mpp/ts.syn @ 0:13d2b8934445
Import AnaGram (near-)release tree into Mercurial.
author: David A. Holland
date: Sat, 22 Dec 2007 17:52:45 -0500
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/examples/mpp/ts.syn	Sat Dec 22 17:52:45 2007 -0500
@@ -0,0 +1,1096 @@
+{
+/*
+ * AnaGram, a System for Syntax Directed Programming
+ * C Macro preprocessor and parser
+ * TS.SYN: Token Scanner Module
+ *
+ * Copyright 1993-2000 Parsifal Software. All Rights Reserved.
+ *
+ * This software is provided 'as-is', without any express or implied
+ * warranty.  In no event will the authors be held liable for any damages
+ * arising from the use of this software.
+ *
+ * Permission is granted to anyone to use this software for any purpose,
+ * including commercial applications, and to alter it and redistribute it
+ * freely, subject to the following restrictions:
+ *
+ * 1. The origin of this software must not be misrepresented; you must not
+ *    claim that you wrote the original software. If you use this software
+ *    in a product, an acknowledgment in the product documentation would be
+ *    appreciated but is not required.
+ * 2. Altered source versions must be plainly marked as such, and must not be
+ *    misrepresented as being the original software.
+ * 3. This notice may not be removed or altered from any source distribution.
+ */
+
+#include "mpp.h"
+
+
+// context structure for diagnostics
+
+struct location { unsigned line, column; };
+
+}
+
+
+// Configuration section
+
+[
+  // far tables                       // uncomment for 16 bit environment
+  context type = location             // request context tracking
+ ~allow macros                        // function defs for red procs
+  auto resynch
+  line numbers                        // #line statements in output
+  error trace                         // build trace on syntax error
+ ~test range                          // not necessary
+ ~declare pcb                         // pcb declared manually
+ ~error frame                         // not wanted for diagnostics
+
+  subgrammar {                        // this subgrammar statement
+    simple token,                     // will be removed and replaced
+    expanded token,                   // with "disregard ws" and
+    initial arg element,              // lexeme statements in the
+    ws,                               // next revision
+    eol,
+    macro definition header,
+  }
+  parser file name = "#.cpp"
+]
+
+
+// Character Set Definitions
+
+any text char   = ~eof - newline - '\\'
+ascii           = 1..126
+blank           = ' ' + '\t' + '\r' + '\f' + '\v'
+digit           = '0-9'
+eof             = -1 + 0
+hex digit       = '0-9' + 'A-F' + 'a-f'
+newline         = '\n'
+letter          = 'a-z' + 'A-Z' + '_'
+not punctuation = '#' + blank + letter + digit + '\'' + '"' + newline + '\\'
+punctuation     = ascii - not punctuation
+simple char     = ~eof - ('\'' + '\\' + '\n')
+string char     = ~eof - ('"' + '\\' + '\n')
+
+
+// Grammar, or Start token
+
+/*
+ The macro/#include structure of a C/C++ program is line oriented, so the
+ main grammar treats the input file as logical sections, separated by
+ any number of new lines.
+
+ eol is defined so that it accepts any number of blank lines and any leading
+ spaces on the first following nonblank line. Lines containing only comments
+ are considered blank lines.
+
+ Input text, as it is recognized is sunk through the scanner_sink pointer.
+ scanner_sink is normally the output of the scanner, but when it is necessary
+ to accumulate text, as for a macro definition, scanner_sink is switched to
+ direct text to a buffer. When the end of the macro definition is encountered,
+ the scanner_sink is switched back to its previous setting.
+*/
+
+input file $                                // Grammar Token
+ -> [section | eol]/..., eof                // Alternating sequence
+
+eol
+ -> newline, [newline | space]...
+
+
+/*
+ Conditional Compilation Control
+
+ This is the portion of the grammar that parsers #if/#ifdef#ifndef/#elif/#else/#endif
+ and determines which lines of text are to be passed on for further processing
+ and which are to be simply ignored.
+
+ A "section" is any nonblank line of input, or an if/endif block of lines
+ that should be passed on to the C compiler.
+
+ A "skip_section" is a non blank line of input or and if/endif block of lines
+ that should be passed over and ignored.
+
+ "expanded token" represents the _result_ of macro substitution
+
+ "control line" is any line beginning with # that is not an if/elsif/endif
+ line.
+
+ A conditional block is everything from an #if, #ifdef, #ifndef to the
+ matching #endif
+*/
+
+section
+ -> expanded token...                       =*scanner_sink << op('\n');
+ -> control line
+ -> conditional block
+
+/*
+ There are basically two syntaxes for the body of any block of text
+ controlled by an #if statement: One syntax, "true if section", to be used
+ if the if condition is true and one, "false if section", to be used to skip
+ over it if the condition is false. In like manner, there are two syntaxes
+ for the body of the else block: "skip else section" to be used when the
+ if condition is true and "else section", to be used when the if condition
+ is false.
+
+ The syntax for "conditional block" enumerates all possible combinations.
+
+This simple analysis is complicated by the existence of the #elif statement.
+This complication occasions a moderately complex cross recursion between
+"true if section" and "false if section".
+
+Note that a "false if section" is a false #if line followed by all
+statements up to an #else statement or a true #elif line. A "true if
+section" consists of a true #if line followed by everything up to the
+next matching #elif or #else line, or it consists of false if sections
+followed eventually by a true #elif line and then subsequent lines
+up to a following #else or #elif line.
+
+"skip section" is syntax to skip over any text including matched
+#if/#ifdef/#ifndef, #endif pairs.
+*/
+
+conditional block
+ -> true if section, eol, endif line
+ -> true if section, eol, skip else section, eol, endif line
+ -> false if section, eol, endif line
+ -> false if section, eol, else section, eol, endif line
+
+true if section
+ -> true condition
+ -> true if section, eol, section
+ -> false if section, eol, true else condition
+
+false if section
+ -> false condition
+ -> false if section, eol, skip section
+ -> false if section, eol, false else condition
+
+/*
+ "else section" handles lines of text (and nested #if/#endif sections
+ starting with an #else line. "else section" should always be followed
+ in any syntactic use by eol, endif line to terminate the looping.
+*/
+
+else section
+ -> '#', ws?, "else", ws?
+ -> else section, eol, section
+
+endif line
+ -> '#', ws?, "endif", ws?
+
+/*
+ "skip section" skips a single line, or an entire if/endif block
+*/
+
+skip section
+ -> skip line
+ -> skip if section, eol, endif line
+
+/*
+ "skip if section" can be terminated only by an "endif line"
+ Note that it simply skips over #else and #elif lines, since
+ they are immaterial in context.
+*/
+
+skip if section
+ -> '#', ws?, {"if" | "ifdef" | "ifndef"}, any text?...
+ -> skip if section, eol, skip section
+ -> skip if section, eol, skip else line
+
+/*
+ "skip else section" begins with an #elif or #else line and continues
+ to a terminating #endif line.
+*/
+
+skip else section
+ -> skip else line
+ -> skip else section, eol, skip else line
+ -> skip else section, eol, skip section
+
+skip else line
+ -> '#', ws?, "elif", any text?...
+ -> '#', ws?, "else", ws?
+
+/*
+ "skip line" parses over and ignores any line that is not an
+ #if, #elif, #else, or #endif line.
+*/
+
+skip line
+ -> '#', ws?, [{"define" | "undefine" | "include" | "line" |
+                    "error" | "pragma"}, any text?...]
+ -> not control mark, any text?...
+
+any text
+ -> any text char
+ -> '\\', ~eof
+
+not control mark
+ -> any text char - '#'
+ -> '\\', ~eof
+
+
+/*
+ Conditional Control Lines
+
+ A semantically determined production is used to determine whether
+ an #if, #ifdef, or #ifndef line should be treated as a true
+ condition or a false condition. #ifdef and #ifndef can be
+ resolved simply by determining whether a symbol has or has
+ not been defined. #if is more complex and requires
+ evaluation of a constant expression. It does this by passing
+ the expanded argument string to the expression evaluator
+ in ex.syn
+*/
+
+true condition, false condition
+ -> '#', ws?, "ifdef", ws, name string, ws?           =check_defined(1);
+ -> '#', ws?, "ifndef", ws, name string, ws?          =check_defined(0);
+ -> '#', ws?, if header, expanded token...            =eval_if();
+
+true else condition, false else condition
+ -> '#', ws?, else if header, expanded token...       =eval_elif();
+
+/*
+ "if header" and "else if header" are simple wrapper tokens to
+ provide a hook for marking the beginning of the text that
+ is to be used by the expression evaluator. The init_condition()
+ function handles this task.
+*/
+
+if header
+ -> "if", ws                                          =init_condition();
+
+else if header
+ -> "elif", ws                                        =init_condition();
+
+
+/*
+ Other Control Lines
+
+ Relative to the complexity of the if/elif/else/endif logic, other
+ control lines are moderately straightforward.
+
+ The #include file is handled simply by stacking the current file
+ position and opening the indicated file. When end of file is
+ encountered on the newly opened file, the current file position
+ will be unstacked and parsing will continue as though nothing
+ had happened.
+
+ Note that there is nothing that requires that an #if/#ifdef#ifndef
+ and the matching #endif be in the same file.
+
+ #undef is trivial
+
+ #line, #error, #pragma lines are simply ignored
+
+ #define has substantial struture. It begins with the header portion
+ that identifies the macro to be defined and coninues with the
+ body of the macro definition. "macro definition header" identifies
+ the name and type of the macro and initializes the accumulation of
+ the tokens which comprise the body of the macro.
+*/
+
+control line
+ -> include header, expanded token...                 =include_file();
+ -> '#', ws?, "undef", ws, name string, ws?           =undefine();
+ -> '#', ws?, [{"line" | "error" | "pragma"}, any text?...]
+ -> macro definition header:id, simple token?...      =save_macro_body(id);
+
+include header
+ -> '#', ws?, "include" =save_sink << scanner_sink, scanner_sink = &++ta;
+
+
+/*
+ Macro Definitions
+
+ There are two types of macros: those with arguments and those without.
+ They are rather different in the way they have to be handled.
+*/
+
+(int) macro definition header
+ -> '#', ws?, "define", ws, name string         =init_macro_def(0,0);
+ -> '#', ws?, "define", ws, name string,
+      '(', ws?, parameter list:n, ')'          =init_macro_def(n,1);
+
+(int) parameter list
+ ->                                       =0;
+ -> names, ws?
+
+(int) names
+ -> name string                           =1;
+ -> names:n, ws?, ',', ws?, name string   =n+1;
+
+/*
+ Unexpanded text (for macro definitions)
+
+ If there are macro invocations in the body of a macro, they are
+ supposed to be expanded only when the macro itself is invoked, not
+ when the macro is defined. This means that the processing of
+ the body of the macro definition has to be different from the
+ processing of ordinary text.
+
+ simple token is a token as it appears in the input stream.
+
+ expanded token is the result of passing a token through macro
+ expansion.
+*/
+
+simple token
+ -> space:c                               =*scanner_sink << space_op(c);
+ -> word
+ -> separator
+ -> '#'                                   =*scanner_sink << op('#');
+ -> qualified real
+ -> integer constant
+
+word
+ -> name string                           =*scanner_sink << name_token();
+
+
+// Expanded text
+
+expanded token
+ -> expanded word
+ -> separator
+ -> space
+ -> qualified real
+ -> integer constant
+
+/*
+ The semantically determined production below classifies a name string
+ into the categories variable, simple macro, macro or defined (as in #if defined(x))
+ so that the parser can do appropriate follow up parsing.
+
+ expand() is called to expand macros. Note that a macro that is defined with
+ an parameter list (whether or not the list is empty) is not expanded unless
+ it is invoked with a parameter list.
+*/
+
+expanded word
+ -> variable:t                                    =*scanner_sink << t;
+ -> simple macro:t                                =expand(t,0);
+ -> macro:t, ws?                                  =*scanner_sink << t;
+ -> macro:t, ws?, '(', ws?, macro arg list:n, ')' =expand(t,n);
+ -> defined, ws?, '(', ws?, name string, ws?, ')' =*scanner_sink << defined();
+ -> defined, ws, name string                      =*scanner_sink << defined();
+
+
+// Name classification
+
+(token) variable, simple macro, macro, defined
+ -> name string                              =id_macro();
+
+
+/*
+ Macro Arguments
+
+ Macro arguments are accumulated as separate token strings on the
+ token accumulator stack.
+*/
+
+
+(int) macro arg list
+ ->                                          =0;
+ -> !save_sink << scanner_sink, scanner_sink = &ta;, macro args:n =
+     save_sink >> scanner_sink, n;
+
+(int) macro args
+ -> increment ta, arg elements                              =1;
+ -> macro args:n, ',', ws?, increment ta, arg elements      =n+1;
+
+// increment ta could be replaced with an "immediate action"
+
+(void) increment ta
+ ->  /* Null Production */ =++ta;
+
+/*
+ The following is somewhat complex partly to skip leading space.
+*/
+
+arg elements
+ -> initial arg element
+ -> arg elements, arg element
+
+arg element
+ -> space:c                              =*scanner_sink << space_op(c);
+ -> initial arg element
+
+initial arg element
+ -> name string                          =*scanner_sink << name_token();
+ -> qualified real
+ -> integer constant
+ -> string literal                  =*scanner_sink << tkn(STRINGliteral);
+ -> character constant              =*scanner_sink << tkn(CHARACTERconstant);
+ -> operator
+ -> punctuation - '(' - ',' - ')':p      =*scanner_sink << op(p);
+ -> nested elements, ')':t               =*scanner_sink << op(t);
+
+nested elements
+ -> '(':t                                =*scanner_sink << op(t);
+ -> nested elements, arg element
+ -> nested elements, ',':t               =*scanner_sink << op(t);
+
+
+/*
+ Basic lexical elements
+
+ The remainder of the syntax file consists of the definitions of the
+ basic lexical elements of C.
+
+ The basic lexical elements are simply copied to the scanner_sink as
+ they are encountered. Note that it is not the character string itself
+ that goes to the scanner_sink but rather a token which consists of
+ a type identification and a handle that can be used to recover the
+ string from a dictionary.
+*/
+
+separator
+ -> string literal        =*scanner_sink << tkn(STRINGliteral);
+ -> character constant    =*scanner_sink << tkn(CHARACTERconstant);
+ -> operator
+ -> punctuation:p         =*scanner_sink << op(p);
+ -> '\\', '\n'
+
+(int) space
+ -> blank
+ -> comment                                  =' ';
+
+ws = space...
+
+comment
+ -> comment head, "*/"
+
+comment head
+ -> "/*"
+ -> comment head, ~eof
+
+comment, comment head
+ -> comment head, comment ={if (nest_comments) CHANGE_REDUCTION(comment_head);}
+
+operator
+ -> '&', '&'                  =*scanner_sink << op(ANDAND);
+ -> '&', '='                  =*scanner_sink << op(ANDassign);
+ -> '-', '>'                  =*scanner_sink << op(ARROW);
+ -> '#', '#'                  =*scanner_sink << op(CONCAT);
+ -> '-', '-'                  =*scanner_sink << op(DECR);
+ -> '/', '='                  =*scanner_sink << op(DIVassign);
+ -> '.', '.', '.'             =*scanner_sink << op(ELLIPSIS);
+ -> '=', '='                  =*scanner_sink << op(EQ);
+ -> '^', '='                  =*scanner_sink << op(ERassign);
+ -> '>', '='                  =*scanner_sink << op(GE);
+ -> '+', '+'                  =*scanner_sink << op(ICR);
+ -> '<', '='                  =*scanner_sink << op(LE);
+ -> '<', '<'                  =*scanner_sink << op(LS);
+ -> '<', '<', '='             =*scanner_sink << op(LSassign);
+ -> '%', '='                  =*scanner_sink << op(MODassign);
+ -> '-', '='                  =*scanner_sink << op(MINUSassign);
+ -> '*', '='                  =*scanner_sink << op(MULTassign);
+ -> '!', '='                  =*scanner_sink << op(NE);
+ -> '|', '='                  =*scanner_sink << op(ORassign);
+ -> '|', '|'                  =*scanner_sink << op(OROR);
+ -> '+', '='                  =*scanner_sink << op(PLUSassign);
+ -> '>', '>'                  =*scanner_sink << op(RS);
+ -> '>', '>', '='             =*scanner_sink << op(RSassign);
+
+
+// Numeric constants
+
+qualified real
+ -> real constant, floating qualifier =*scanner_sink << tkn(FLOATconstant);
+
+real constant
+ -> real
+
+floating qualifier
+ ->
+ -> 'f' + 'F'             =sa << 'F';
+ -> 'l' + 'L'             =sa << 'L';
+
+real
+ -> simple real
+ -> simple real, exponent
+ -> confusion, exponent
+ -> decimal integer, exponent
+
+simple real
+ -> confusion, '.'                         =sa << '.';
+ -> octal integer, '.'
+ -> decimal integer, '.'                   =sa << '.';
+ -> '.', '0-9':d                           =++sa << '.' << d;
+ -> simple real, '0-9':d                   =sa << d;
+
+confusion
+  -> octal integer, '8-9':d                =sa << d;
+  -> confusion, '0-9':d                    =sa << d;
+
+exponent
+  -> 'e' + 'E', '-', '0-9':d               =sa << '-' << d;
+  -> 'e' + 'E', '+'?, '0-9':d              =sa << '+' << d;
+  -> exponent, '0-9':d                     =sa << d;
+
+integer qualifier
+  -> 'u' + 'U'                       =sa << 'U';
+  -> 'l' + 'L'                       =sa << 'L';
+
+integer constant
+ -> octal constant                        =*scanner_sink << tkn(OCTconstant);
+ -> decimal constant                      =*scanner_sink << tkn(DECconstant);
+ -> hex constant                          =*scanner_sink << tkn(HEXconstant);
+
+octal constant
+ -> octal integer
+ -> octal constant, integer qualifier
+
+octal integer
+  -> '0'                                 =++sa << '0';
+  -> octal integer, '0-7':d              =sa << d;
+
+hex constant
+ -> hex integer
+ -> hex constant, integer qualifier
+
+hex integer
+  -> '0', 'x' + 'X', hex digit:d         =++sa << "0X" << d;
+  -> hex integer, hex digit:d            =sa << d;
+
+decimal constant
+ -> decimal integer
+ -> decimal constant, integer qualifier
+
+decimal integer
+  -> '1-9':d                               =++sa << d;
+  -> decimal integer, '0-9':d              =sa << d;
+
+
+// String Literals and Character Constants
+
+string literal
+  -> string chars, '"'                     =sa << '"';
+
+string chars
+ -> '"'                                    =++sa << '"';
+ -> string chars, string char:c            =sa << c;
+ -> string chars, '\\', ~eof - '\n':c      =sa << '\\' << c;
+ -> string chars, '\\', '\n'
+
+
+// Character constants
+
+character constant
+ -> simple chars, '\''                     =sa << '\'';
+
+simple chars
+ -> '\''                                   =++sa << '\'';
+ -> simple chars, simple char:c            = sa << c;
+ -> simple chars, '\\', ~eof - '\n': c     = sa << '\\' << c;
+ -> simple chars, '\\', '\n'
+
+
+// Identifiers
+
+name string
+  -> letter:c                              =++sa << c;
+  -> name string, letter+digit:c           =sa << c;
+
+
+{                                      // Embedded C
+#include "array.h"                     // \AnaGram\classlib\include\array.h
+#include "stack.h"                     // \AnaGram\classlib\include\stack.h
+#if defined(__MSDOS__) || defined(__WIN32__)
+#include <io.h>                        // If not found, not necessary
+#endif
+#include <sys/types.h>                 // If not found, not necessary
+#include <sys/stat.h>
+#include <fcntl.h>
+
+
+// Macro Definitions
+
+#define SYNTAX_ERROR syntax_error_scanning(PCB.error_message)
+#define GET_CONTEXT (CONTEXT.line = PCB.line, CONTEXT.column = PCB.column)
+#define GET_INPUT (PCB.input_code = getc(input.file))
+#define PCB input.pcb
+
+
+// Structure Definition
+
+struct file_descriptor {
+  char *name;                          // name of file
+  FILE *file;                          // source of input characters
+  ts_pcb_type pcb;                     // parser control block for file
+};
+
+typedef stack<file_descriptor> file_descriptor_stack;
+
+// Static Data Declarations
+
+static const char            *error_modifier = "";
+static file_descriptor        input;
+static stack<token_sink *>    save_sink(5);
+static file_descriptor_stack  active_files(20);
+
+// Syntax Error Reporting
+/*
+ syntax_error() provides an error diagnostic procedure for those
+ parsers which are called by the token scanner. error_modifier is set
+ by expand() so that an error encountered during a macro expansion
+ will be so described.  Otherwise, the diagnostic will not make
+ sense.
+
+ Since all other parsers are called from reduction procedures, the
+ line and column number of the token they are dealing with is given
+ by the context of the token scanner production that is being
+ reduced.
+*/
+
+void syntax_error(const char *msg)  {
+  printf("%s: Line %d, Column %d: %s%s\n",
+   input.name, CONTEXT.line, CONTEXT.column, msg, error_modifier);
+}
+
+/*
+ syntax_error_scanning() provides an error diagnostic procedure for
+ the token scanner itself. The locus of the error is given by the
+ current line and column number of the token scan, as given in the
+ parser control block.
+*/
+
+static void syntax_error_scanning(const char *msg)  {
+  printf("%s: Line %d, Column %d: %s\n",
+    input.name, PCB.line, PCB.column, msg);
+}
+
+
+// Support for Reduction Procedures
+/*
+ name_token() looks up the name string in the string accumulator,
+ identifies it in the token dictionary, checks to see if it is a
+ reserved word, and creates a token.
+*/
+
+static token name_token(void) {
+  token t;
+  t.id = NAME;
+  t.handle = td << sa.top();
+  --sa;
+  if (t.handle <= n_reserved_words) t.id = reserved_words[t.handle].id;
+  return t;
+}
+
+/*
+ op() creates a token for a punctuation character.
+*/
+
+static token op(unsigned x) {
+  token t;
+  t.id = (token_id) x;
+  t.handle = token_handles[x];
+  return t;
+}
+
+/*
+ space_op() creates a token for a space character. Note that a space
+ could be a tab, vertical tab, or form feed character as well as a
+ blank.
+*/
+
+static token space_op(unsigned x) {
+  token t;
+  t.id = (token_id) ' ';
+  t.handle = token_handles[x];
+  return t;
+}
+
+/*
+ tkn() creates a token with a specified id for the string on the top
+ of the string accumulator
+*/
+
+static token tkn(token_id id) {
+  token t;
+  t.id = id;
+  t.handle = td << sa.top();
+  --sa;
+  return t;
+}
+
+
+// Macro Processing Procedures
+
+/*
+ check_defined() looks up the name on the string accumulator to see if
+ it is the name of a macro. It then selects a reduction token according
+ to the outcome of the test and an input flag.
+*/
+
+static void check_defined(int flag) {
+  unsigned id = macro_id[td[sa.top()]];
+  --sa;
+  flag ^= id != 0;
+  if (flag) CHANGE_REDUCTION(false_condition);
+  else CHANGE_REDUCTION(true_condition);
+}
+
+/*
+ defined() returns a decimal constant token equal to one or zero
+ depending on whether the token named on the string accumulator is or
+ is not defined as a macro
+*/
+
+static token defined(void) {
+  unsigned id = macro_id[td[sa.top()]];
+  token t;
+  t.id = DECconstant;
+  t.handle = id ? one_value : zero_value;
+  --sa;
+  return t;
+}
+
+/*
+ expand() expands and outputs a macro. t.handle is the token dictionary
+ index of the macro name. n is the number of arguments found.
+
+ Since it is possible that scanner sink is pointing to ta, it is
+ necessary to pop the expanded macro from ta before passing it on to
+ scanner_sink. Otherwise, we would have effectively ta << ta, a
+ situation which causes an infinite loop.
+*/
+
+static void expand(token t, unsigned n) {
+  error_modifier = " in macro expansion"; // fix error diagnostic
+  expand_macro(t,n);                      // Defined in MAS.SYN
+  if (size(ta)) {
+    array<token> x(ta,size(ta) + 1);
+    --ta;
+    *scanner_sink << x;
+  } else --ta;
+  error_modifier = "";
+}
+
+/*
+ Look up the name string on the string accumulator. Determine whether
+ it is a reserved word, or a simple identifier. Then determine
+ whether it is the name of a macro.
+*/
+
+static token id_macro(void) {
+  token t;
+  unsigned id;
+
+  t.id = NAME;
+  t.handle = td << sa.top();
+  --sa;
+  if (t.handle <= n_reserved_words) t.id = reserved_words[t.handle].id;
+
+  if (if_clause && t.handle == defined_value) {
+    CHANGE_REDUCTION(defined);
+    return t;
+  }
+  id = macro_id[t.handle];
+  if (id == 0) return t;
+
+  if (macro[id].parens) CHANGE_REDUCTION(macro);
+  else CHANGE_REDUCTION(simple_macro);
+  return t;
+}
+
+/*
+ Start a macro definition. This procedure defines all but the body of
+ the macro.
+
+ nargs is the count of parameters that were found.  flag is set if
+ the macro was defined with parentheses.
+
+ The parameter names are on the string accumulator, with the last
+ name on the top of the stack, so they must be popped off, identified
+ and stored in reverse order.
+
+ The name of the macro is beneath the parameter names on the string
+ accumulator.
+
+ Before returning, this procedure saves the current value of
+ scanner_sink, increments the level on the token stack and sets
+ scanner_sink so that subsequent tokens produced by the token scanner
+ will accumulate on the token stack. These tokens comprise the body
+ of the macro. When the end of the macro body is encountered, the
+ procedure save_macro_body will remove them from the token stack and
+ restore the value of scanner_sink.
+*/
+
+static int init_macro_def(int nargs, int flag) {
+  int k;
+  int id = ++n_macros;
+  unsigned name;
+  unsigned *arg_list = nargs ? new unsigned[nargs] : NULL;
+
+  assert(id < N_MACROS);
+  for (k = nargs; k--;) {
+    arg_list[k] = td << sa.top();
+    --sa;
+  }
+
+  macro[id].arg_names = arg_list;
+  macro[id].n_args = nargs;
+
+  macro[id].name = name = td << sa.top();
+  --sa;
+
+  macro_id[name] = id;
+
+  macro[id].busy_flag = 0;
+  macro[id].parens = flag ;
+
+  save_sink << scanner_sink;
+  scanner_sink = &++ta;
+  return id;
+}
+
+/*
+ save_macro_body() finishes the definition of a macro by making a
+ permanent copy of the token string on the token accumulator. It then
+ restores the scanner_sink to the value it had when the macro
+ definition was encountered.
+*/
+
+static void save_macro_body(int id) {
+  macro[id].body = size(ta) ? copy(ta) : NULL;
+  --ta;
+  save_sink >> scanner_sink;
+}
+
+/*
+ undefine() deletes the macro definition for the macro whose name is
+ on the top of the string accumulator. If there is no macro with the
+ given name, undefine simply returns.
+
+ Otherwise, it frees the storage associated with the macro. It then
+ fills the resulting hole in the table with the last macro in the
+ table. The macro_id table is updated appropriately.
+*/
+
+static void undefine(void) {
+  unsigned name = td << sa.top();
+  int id = macro_id[name];
+  --sa;
+  if (id == 0) return;
+  macro_id[name] = 0;
+  if (macro[id].arg_names) delete [] macro[id].arg_names;
+  if (macro[id].body) delete [] macro[id].body;
+  macro[id] = macro[n_macros--];
+  macro_id[macro[id].name] = id;
+}
+
+
+// Include file procedures
+
+/*
+ file_name() interprets the file name provided by an #include
+ statement. If the file name is enclosed in <> brackets it scans the
+ directory list in paths to try to find the file. If it finds it, it
+ prefixes the path to the file name.
+
+ If the file name is enclosed in "" quotation marks, file_name()
+ simply strips the quotation marks.
+
+ If file_name() succeeds, it returns 1 and provides path-name in the
+ string accumulator, otherwise it returns 0 and nothing in the string
+ accumulator.
+
+ Note that file name uses a temporary string accumulator, lsa.
+*/
+
+static int file_name(char *file) {
+  int c;
+  int tc;
+  string_accumulator lsa(100);       // for temporary storage of name
+
+  while (*file == ' ') file++;
+  tc = *file++;
+  if (tc == '<') tc = '>';
+  else if (tc != '"') return 0;
+  while ((c = *file++) != 0 && c != tc) lsa << c;
+  if (c != tc) return 0;
+  if (tc == '"') {
+    int k, n;
+    active_files << input;
+    n = size(active_files);
+
+    while (n--) {
+      FILE *f;
+#ifdef _MSC_VER                  //Cope with peculiarity of MSVC++
+      char *cp;
+      int junk;
+
+      ++sa << ((file_descriptor *)active_files)[n].name;
+      k = size(sa);
+      cp = (char *)sa;
+      while (k-- && cp[k] != '\\' && cp[k] != '/') { sa >> junk;}
+#else
+      ++sa << active_files[n].name;
+      while (size(sa) && sa[0] != '\\' && sa[0] != '/') {
+         sa >> k;   // strip off current file name to leave only path
+      }
+#endif
+      sa << lsa;    // append desired file name
+      f = fopen(sa.top(),"rt");
+      if (f != NULL) {
+        fclose(f);
+        active_files >> input;
+        return 1;
+      }
+      --sa;
+    }
+    active_files >> input;
+  }
+  int k, n;
+  n = size(paths);
+  for (k = 0; k < n; k++) {
+    FILE *f;
+
+#ifdef _MSC_VER                  //Cope with peculiarity of MSVC++
+    ++sa << ((char **) paths)[k];
+    char c = ((char *)sa)[size(sa)-1];
+    if (size(sa) && c != '\\' && c != '/') sa << '/';
+#else
+    ++sa << paths[k];
+    if (size(sa) && sa[0] != '\\' && sa[0] != '/') sa << '/';
+#endif
+    sa << lsa;
+    f = fopen(sa.top(),"rt");
+    if (f != NULL) {
+      fclose(f);
+      return 1;
+    }
+    --sa;
+  }
+  return 0;
+}
+
+/*
+ include_file() is called in response to a #include statement.
+
+ First, it saves the file_descriptor for the current input. Then it
+ restores the scanner_sink which was saved prior to accumulating
+ macro expanded tokens on the token_accumulator.
+
+ When include_file() is called, the argument of the #include
+ statement exists in the form of tokens on the token accumulator.
+ These tokens are passed to a token_translator which turns the tokens
+ into a string on the string accumulator.
+
+ file_name() is then called to distinguish between "" and <> files.
+ In the latter case, file_name() prefixes a directory path to the name.
+ The name is then in the string accumulator.
+
+ scan_input() is then called to scan the include file.
+
+ Finally, before returning, the previous file_descriptor is restored.
+*/
+
+static void include_file(void) {
+  int flag;
+
+  save_sink >> scanner_sink;               // restore scanner_sink
+
+  token_translator tt(&++sa);
+  tt << ta;                                // recover string from tokens
+  --ta;                                    // discard token string
+
+  array<char> file(sa.top(), size(sa)+1);  // local copy of string
+  --sa;
+
+  flag = file_name(file);
+
+  if (!flag) {
+    fprintf(stderr, "Bad include file name: %s\n", (char *) file);
+    return;
+  }
+  array<char> path(sa.top(), size(sa) + 1);
+  --sa;
+  active_files << input;                     // Save current file
+  scan_input(path);                          // recursive call to ts()
+  active_files >> input;                     // Restore previous file
+  return;
+}
+
+
+// Conditional compilation procedures
+
+/*
+ init_condition() prepares for evaluation the condition expression in
+ #if and #elif statements.
+
+ It protects scanner_sink by pushing it onto the save_sink stack.
+ Then it resets the expression evaluatior, condition, and sets
+ scanner_sink to point to it.
+
+ Finally it sets the if_clause flag so that defined() will be handled
+ properly.
+*/
+
+static void init_condition(void) {
+  save_sink << scanner_sink;
+  scanner_sink = &reset(condition);
+  if_clause = 1;
+}
+
+/*
+ eval_condition() is called to deal with #if and #elif statements. The
+ init_condition() procedure has redirected scanner output to the
+ expression evaluator, so eval_condition() restores the previous
+ scanner destination.
+
+ It then sends an eof token to the expression evaluator, resets
+ if_clause and reads the value of the condition. Remember that
+ (long) condition returns the value of the expression.
+*/
+
+static int eval_condition(void) {
+  save_sink >> scanner_sink;
+  condition << op(0);                      // eof to exp evaluator
+  if_clause = 0;
+  return condition != 0L;
+}
+
+/*
+ In eval_if() and eval_elif() note the use of CHANGE_REDUCTION to
+ select the appropriate reduction token depending on the outcome of
+ the condition.
+*/
+
+static void eval_elif(void) {
+  if (eval_condition()) CHANGE_REDUCTION(true_else_condition);
+  else CHANGE_REDUCTION(false_else_condition);
+}
+
+static void eval_if(void) {
+  if (eval_condition()) CHANGE_REDUCTION(true_condition);
+  else CHANGE_REDUCTION(false_condition);
+}
+
+
+// Do token scan
+
+/*
+ scan_input()
+   1) opens the specified file, if possible
+   2) calls the parser
+   3) closes the input file
+*/
+
+void scan_input(char *path) {
+  input.file = fopen(path, "rt");
+  input.name = path;
+  if (input.file == NULL) {
+    fprintf(stderr,"Cannot open %s\n", (char *) path);
+    return;
+  }
+  ts();
+  fclose(input.file);
+}
+
+}                                      // End of Embedded C
author	David A. Holland
date	Sat, 22 Dec 2007 17:52:45 -0500
parents
children