home *** CD-ROM | disk | FTP | other *** search
- /*Program 4_3 - Simple gramatical parser using state tables
- by Stephen Davis, 1987
-
- Impliment a simple sentence parser using a state table approach.
- Program recognizes uppercase, lowercase, comma, space, period
- and newline.
- */
-
- #include <stdio.h>
- #include <ctype.h>
- #define maxcases 5
- enum chartype {invalid = 1, period,
- space, comma, newline,
- lowercase, uppercase};
- #define marker 0x5678
-
- /*prototype definitions --*/
- enum chartype evaluate (char);
- int parse (struct state **, char);
- void fixup (void);
- int main (void);
-
- /*grammatical state table*/
- struct state {
- unsigned signature;
- char currvalue;
- struct {
- enum chartype value;
- struct state *next;
- } choice [maxcases];
- struct state *error;
- } *current;
-
- struct state start = {marker, 0, {{uppercase, NULL /*&normal*/},
- {0, NULL},
- {0, NULL},
- {0, NULL},
- {0, NULL}},
- NULL /*&normal*/},
- normal= {marker, lowercase, {{lowercase, &normal},
- {space, NULL /*&break1*/},
- {comma, NULL /*&break2*/},
- {period, NULL /*&end1*/},
- {newline, NULL /*&begline*/}},
- &normal},
- break1= {marker, space, {{lowercase, &normal},
- {uppercase, &normal},
- {0, NULL},
- {0, NULL},
- {0, NULL}},
- &normal},
- break2= {marker, comma, {{space, &break1},
- {newline, NULL /*&begline*/},
- {0, NULL},
- {0, NULL},
- {0, NULL}},
- &normal},
- end1 = {marker, period, {{space, NULL /*&end2*/},
- {newline, &start},
- {0, NULL},
- {0, NULL},
- {0, NULL}},
- &start},
- end2 = {marker, space, {{space, &start},
- {0, NULL},
- {0, NULL},
- {0, NULL},
- {0, NULL}},
- &start},
- begline={marker, newline, {{uppercase, &normal},
- {lowercase, &normal},
- {0, NULL},
- {0, NULL},
- {0, NULL}},
- &normal};
-
-
- /*Evaluate - evaluate the current character. Return corresponding
- chartype*/
- enum chartype evaluate (c)
- char c;
- {
- switch (c) {
- case '.':
- case '?': return period;
- case ',': return comma;
- case ' ': return space;
- case '\n':return newline;
- default:
- if (islower (c))
- return lowercase;
- else
- if (isupper (c))
- return uppercase;
- else
- return invalid;
- }
- }
-
- /*Parse - given the current state, compare the current character
- against the legal choices to select the next state.
- Return a 1 on no error and a 0 on error.*/
- int parse (stateptr, c)
- struct state **stateptr;
- char c;
- {
- unsigned i;
- enum chartype val;
- struct state *localptr;
-
- localptr = *stateptr;
- if (localptr -> signature != marker) {
- printf ("pointer error!\n");
- *stateptr = &start;
- } else {
- val = evaluate (c);
- for (i = 0; i < maxcases; i++)
- if (localptr -> choice [i].value == val) {
- *stateptr = localptr -> choice [i].next;
- return 1;
- }
- }
- *stateptr = localptr -> error;
- return 0;
- }
-
- /*Fixup - forward references are not allowed in data initializations.
- Fixup initializes those values which would generate error
- messages in a data initialization.*/
- void fixup ()
- {
- start.choice[0].next = &normal;
- start.error = &normal;
-
- normal.choice[1].next = &break1;
- normal.choice[2].next = &break2;
- normal.choice[3].next = &end1;
- normal.choice[4].next = &begline;
-
- break2.choice[1].next = &begline;
-
- end1.choice[0].next = &end2;
- }
-
- /*Main - read in strings from STDIN. Parse them against our state
- table grammar rules. Point out any errors detected.*/
- main ()
- {
- char buffer [256], *ptr, mark;
-
- fixup (); /*complete pointer init*/
-
- current = &start;
- while (gets (buffer)) {
- printf ("%s\n", buffer);
- for (ptr = buffer; *ptr; ptr++) {
- if (parse (¤t, *ptr))
- mark = ' ';
- else
- mark = '^';
- printf ("%c", mark);
- }
- parse (¤t, '\n'); /*tack on a carriage return*/
- printf ("\n");
- }
- }