OS/2 Shareware BBS: 10 Tools

home *** CD-ROM | disk | FTP | other *** search

/ OS/2 Shareware BBS: 10 Tools / 10-Tools.zip / pccts1.zip / ANTLR / BITS.C < prev next >

Wrap

C/C++ Source or Header | 1993-09-02 | 11KB | 455 lines

/* * bits.c -- manage creation and output of bit sets used by the parser. * * $Id: bits.c,v 1.8 1993/08/24 14:44:32 pccts Exp pccts $ * $Revision: 1.8 $ * * SOFTWARE RIGHTS * * We reserve no LEGAL rights to the Purdue Compiler Construction Tool * Set (PCCTS) -- PCCTS is in the public domain. An individual or * company may do whatever they wish with source code distributed with * PCCTS or the code generated by PCCTS, including the incorporation of * PCCTS, or its output, into commerical software. * * We encourage users to develop software with PCCTS. However, we do ask * that credit is given to us for developing PCCTS. By "credit", * we mean that if you incorporate our source code into one of your * programs (commercial product, research project, or otherwise) that you * acknowledge this fact somewhere in the documentation, research report, * etc... If you like PCCTS and have developed a nice tool with the * output, please mention that you developed it using PCCTS. In * addition, we ask that this header remain intact in our source code. * As long as these guidelines are kept, we expect to continue enhancing * this system and expect to make other tools available as they are * completed. * * ANTLR 1.10 * Terence Parr * Purdue University * 1989-1993 */ #include <stdio.h> #include <ctype.h> #ifdef __cplusplus #ifndef __STDC__ #define __STDC__ #endif #endif #include "set.h" #include "syn.h" #include "hash.h" #include "generic.h" #include "dlgdef.h" #define BitsPerByte 8 /* #define BitsPerWord BitsPerByte*sizeof(unsigned) */ /* char is only thing that is pretty much always known == 8 bits * This allows output of antlr (set stuff, anyway) to be androgynous (portable) */ typedef unsigned char SetWordType; #define BitsPerWord BitsPerByte*sizeof(SetWordType) static SetWordType *setwd = NULL; int setnum = -1; int wordnum = 0; int esetnum = 0; /* Used to convert native wordsize, which ANTLR uses (via set.c) to manipulate sets, to bytes that are most portable size-wise. */ void #ifdef __STDC__ DumpIntAsChars( FILE *f, char *format, unsigned wd ) #else DumpIntAsChars( f, format, wd ) FILE *f; char *format; unsigned wd; #endif { int i; /* uses max of 32 bit unsigned integer for the moment */ static unsigned long byte_mask[sizeof(unsigned long)] = { 0xFF, 0xFF00, 0xFF0000, 0xFF000000 }; /* 0xFF00000000, 0xFF0000000000, 0xFF000000000000, 0xFF00000000000000 };*/ /* for each byte in the word */ for (i=0; i<sizeof(unsigned); i++) { /* mask out the ith byte and shift down to the first 8 bits */ fprintf(f, format, (wd&byte_mask[i])>>(i*BitsPerByte)); if ( i<sizeof(unsigned)-1) fprintf(f, ","); } } /* Create a new setwd (ignoring [Ep] token on end) */ void #ifdef __STDC__ NewSetWd( void ) #else NewSetWd( ) #endif { SetWordType *p; if ( setwd == NULL ) { setwd = (SetWordType *) calloc(TokenNum, sizeof(SetWordType)); require(setwd!=NULL, "NewSetWd: cannot alloc set wd\n"); } for (p = setwd; p<&(setwd[TokenNum]); p++) {*p=0;} wordnum++; } /* Dump the current setwd to ErrFile. 0..MaxTokenVal */ void #ifdef __STDC__ DumpSetWd( void ) #else DumpSetWd( ) #endif { int i,c=1; if ( setwd==NULL ) return; fprintf(DefFile, "extern SetWordType setwd%d[];\n", wordnum); fprintf(ErrFile, "SetWordType setwd%d[%d] = {", wordnum, TokenNum-1); for (i=0; i<TokenNum-1; i++) { if ( i!=0 ) fprintf(ErrFile, ","); if ( c == 8 ) {fprintf(ErrFile, "\n\t"); c=1;} else c++; fprintf(ErrFile, "0x%x", setwd[i]); } fprintf(ErrFile, "};\n"); } /* Make a new set. Dump old setwd and create new setwd if current setwd is full */ void #ifdef __STDC__ NewSet( void ) #else NewSet( ) #endif { setnum++; if ( setnum==BitsPerWord ) /* is current setwd full? */ { DumpSetWd(); NewSetWd(); setnum = 0; } } /* s is a set of tokens. Turn on bit at each token position in set 'setnum' */ void #ifdef __STDC__ FillSet( set s ) #else FillSet( s ) set s; #endif { SetWordType mask=(((unsigned)1)<<setnum); unsigned int e; while ( !set_nil(s) ) { e = set_int(s); set_rm(e, s); setwd[e] |= mask; } } /* E r r o r C l a s s S t u f f */ /* compute the FIRST of a rule for the error class stuff */ static set #ifdef __STDC__ Efirst( char *rule, ECnode *eclass ) #else Efirst( rule, eclass ) char *rule; ECnode *eclass; #endif { set rk, a; Junction *r; RuleEntry *q = (RuleEntry *) hash_get(Rname, rule); if ( q == NULL ) { warnNoFL(eMsg2("undefined rule '%s' referenced in errclass '%s'; ignored", rule, TokenStr[eclass->tok])); return empty; } r = RulePtr[q->rulenum]; r->end->halt = TRUE; /* don't let reach fall off end of rule here */ rk = empty; REACH(r, 1, &rk, a); r->end->halt = FALSE; return a; } /* * scan the list of tokens/eclasses/nonterminals filling the new eclass * with the set described by the list. Note that an eclass can be * quoted to allow spaces etc... However, an eclass must not conflict * with a reg expr found elsewhere. The reg expr will be taken over * the eclass name. */ static void #ifdef __STDC__ doEclass( char *eclass ) #else doEclass( eclass ) char *eclass; #endif { TermEntry *q; ECnode *p; ListNode *e; unsigned int t; unsigned deg=0; set a; require(eclass!=NULL, "doEclass: NULL eset"); p = (ECnode *) eclass; lexmode(p->lexclass); /* switch to lexclass where errclass is defined */ p->eset = empty; for (e = (p->elist)->next; e!=NULL; e=e->next) { if ( islower( *((char *)e->elem) ) ) /* is it a rule ref? (alias FIRST request) */ { a = Efirst((char *)e->elem, p); set_orin(&p->eset, a); deg += set_deg(a); set_free( a ); continue; } else if ( *((char *)e->elem)=='"' ) { t = 0; q = (TermEntry *) hash_get(Texpr, (char *) e->elem); if ( q == NULL ) { /* if quoted and not an expr look for eclass name */ q = (TermEntry *) hash_get(Tname, *((char **)&(e->elem))=StripQuotes((char *)e->elem)); if ( q != NULL ) t = q->token; } else t = q->token; } else /* labelled token/eclass */ { q = (TermEntry *) hash_get(Tname, (char *)e->elem); if ( q != NULL ) t = q->token; else t=0; } if ( t!=0 ) { set_orel(t, &p->eset); deg++; } else warnNoFL(eMsg2("undefined token '%s' referenced in errclass '%s'; ignored", (char *)e->elem, TokenStr[p->tok])); } p->setdeg = deg; } void #ifdef __STDC__ ComputeErrorSets( void ) #else ComputeErrorSets( ) #endif { #ifdef __cplusplus list_apply(eclasses, (void (*)(void *)) doEclass); #else #ifdef __STDC__ list_apply(eclasses, (void (*)(void *)) doEclass); #else list_apply(eclasses, doEclass); #endif #endif } /* replace a subset of an error set with an error class name if a subset is found * repeat process until no replacements made */ void #ifdef __STDC__ SubstErrorClass( set *f ) #else SubstErrorClass( f ) set *f; #endif { int max, done = 0; ListNode *p; ECnode *ec, *maxclass = NULL; set a; require(f!=NULL, "SubstErrorClass: NULL eset"); if ( eclasses == NULL ) return; while ( !done ) { max = 0; maxclass = NULL; for (p=eclasses->next; p!=NULL; p=p->next) /* chk all error classes */ { ec = (ECnode *) p->elem; if ( ec->setdeg > max ) { if ( set_sub(ec->eset, *f) || set_equ(ec->eset, *f) ) {maxclass = ec; max=ec->setdeg;} } } if ( maxclass != NULL ) /* if subset found, replace with token */ { a = set_dif(*f, maxclass->eset); set_orel((unsigned)maxclass->tok, &a); set_free(*f); *f = a; } else done = 1; } } /* Define a new error set. WARNING...set-implementation dependent */ int #ifdef __STDC__ DefErrSet( set *f ) #else DefErrSet( f ) set *f; #endif { unsigned *p, *endp; int e=1; require(!set_nil(*f), "DefErrSet: nil set to dump?"); SubstErrorClass(f); p = f->setword; endp = &(f->setword[NumWords(TokenNum-1)]); esetnum++; fprintf(DefFile, "extern SetWordType zzerr%d[];\n", esetnum); fprintf(ErrFile, "SetWordType zzerr%d[%d] = {", esetnum, NumWords(TokenNum-1)*sizeof(unsigned)); while ( p < endp ) { if ( e > 1 ) fprintf(ErrFile, ", "); DumpIntAsChars(ErrFile, "0x%x", *p++); if ( e == 3 ) { if ( p < endp ) fprintf(ErrFile, ","); fprintf(ErrFile, "\n\t"); e=1; } else e++; } fprintf(ErrFile, "};\n"); return esetnum; } void #ifdef __STDC__ GenErrHdr( void ) #else GenErrHdr( ) #endif { int i, j; fprintf(ErrFile, "/*\n"); fprintf(ErrFile, " * A n t l r S e t s / E r r o r F i l e H e a d e r\n"); fprintf(ErrFile, " *\n"); fprintf(ErrFile, " * Generated from:"); for (i=0; i<NumFiles; i++) fprintf(ErrFile, " %s", FileStr[i]); fprintf(ErrFile, "\n"); fprintf(ErrFile, " *\n"); fprintf(ErrFile, " * Terence Parr, Will Cohen, and Hank Dietz: 1989-1993\n"); fprintf(ErrFile, " * Purdue University Electrical Engineering\n"); fprintf(ErrFile, " * ANTLR Version %s\n", Version); fprintf(ErrFile, " */\n\n"); fprintf(ErrFile, "#include <stdio.h>\n"); fprintf(ErrFile, "#define ANTLR_VERSION %s\n", VersionDef); if ( strcmp(ParserName, DefaultParserName)!=0 ) fprintf(ErrFile, "#define %s %s\n", DefaultParserName, ParserName); if ( strcmp(ParserName, DefaultParserName)!=0 ) fprintf(ErrFile, "#include \"%s\"\n", RemapFileName); if ( HdrAction != NULL ) dumpAction( HdrAction, ErrFile, 0, -1, 0, 1 ); if ( FoundGuessBlk ) { fprintf(ErrFile, "#define ZZCAN_GUESS\n"); fprintf(ErrFile, "#include <setjmp.h>\n"); } if ( OutputLL_k > 1 ) fprintf(ErrFile, "#define LL_K %d\n", OutputLL_k); fprintf(ErrFile, "#define zzEOF_TOKEN %d\n", EofToken); fprintf(ErrFile, "#define zzSET_SIZE %d\n", NumWords(TokenNum-1)*sizeof(unsigned)); if ( DemandLookahead ) fprintf(ErrFile, "#define DEMAND_LOOK\n"); fprintf(ErrFile, "#include \"antlr.h\"\n"); if ( GenAST ) fprintf(ErrFile, "#include \"ast.h\"\n"); fprintf(ErrFile, "#include \"%s\"\n", DefFileName); fprintf(ErrFile, "#include \"dlgdef.h\"\n"); fprintf(ErrFile, "#include \"err.h\"\n\n"); /* Dump a zztokens for each automaton */ if ( strcmp(ParserName, DefaultParserName)!=0 ) { fprintf(ErrFile, "char *%s_zztokens[%d]={\n", ParserName, TokenNum-1); } else { fprintf(ErrFile, "char *zztokens[%d]={\n", TokenNum-1); } fprintf(ErrFile, "\t/* 00 */\t\"Invalid\",\n"); if ( TokenStr[EofToken] != NULL ) fprintf(ErrFile, "\t/* %02d */\t\"%s\"", EofToken, TokenStr[i]); else fprintf(ErrFile, "\t/* %02d */\t\"EOF\"", EofToken); for (i=TokenStart; i<TokenNum-1; i++) { if ( i == EpToken ) continue; if ( TokenStr[i] != NULL ) fprintf(ErrFile, ",\n\t/* %02d */\t\"%s\"", i, TokenStr[i]); else { /* look in all lexclasses for the reg expr */ for (j=0; j<NumLexClasses; j++) { lexmode(j); if ( ExprStr[i] != NULL ) { fprintf(ErrFile, ",\n\t/* %02d */\t", i); dumpExpr(ExprStr[i]); break; } } require(j<NumLexClasses, eMsgd("No label or expr for token %d",i)); } } fprintf(ErrFile, "\n};\n"); } void #ifdef __STDC__ dumpExpr( char *e ) #else dumpExpr( e ) char *e; #endif { while ( *e!='\0' ) { if ( *e=='\\' && *(e+1)=='\\' ) {putc('\\', ErrFile); putc('\\', ErrFile); e+=2;} else if ( *e=='\\' && *(e+1)=='"' ) {putc('\\', ErrFile); putc('"', ErrFile); e+=2;} else if ( *e=='\\' ) {putc('\\', ErrFile); putc('\\', ErrFile); e++;} else {putc(*e, ErrFile); e++;} } }