ref: 8426988151d94d69a482e6275777d3f7275dbabe
dir: /src/cmd/cc/cc1/cpp.c/
#include <ctype.h> #include <limits.h> #include <stdio.h> #include <stdlib.h> #include <string.h> #include <time.h> #include <scc/cstd.h> #include <scc/scc.h> #include "cc1.h" struct macroctx { char *name; char *argp; char **arglist; char **listp; char *buffer; char *def; size_t bufsiz; int arglen; int npars; }; static unsigned ncmdlines; static Symbol *symline, *symfile; static unsigned char ifstatus[NR_COND]; static int cppoff; static struct items dirinclude; unsigned cppctx; int disexpand; int disescape; void defdefine(char *macro, char *val, char *source) { char *def, *fmt = "#define %s %s\n"; Symbol dummy = {.flags = SDECLARED}; if (!val) val = ""; def = xmalloc(strlen(fmt) + strlen(macro) + strlen(val)); sprintf(def, fmt, macro, val); lineno = ++ncmdlines; addinput(source, &dummy, def, FAIL); cpp(); delinput(); } void undefmacro(char *s) { killsym(lookup(NS_CPP, s, NOALLOC)); } void icpp(void) { static char sdate[14], stime[11]; struct tm *tm; time_t t; static char **bp, *list[] = { "__STDC__", "__STDC_HOSTED__", "__SCC__", NULL }; t = time(NULL); tm = localtime(&t); strftime(sdate, sizeof(sdate), "\"%b %d %Y\"", tm); strftime(stime, sizeof(stime), "\"%H:%M:%S\"", tm); defdefine("__DATE__", sdate, "built-in"); defdefine("__TIME__", stime, "built-in"); defdefine("__STDC_VERSION__", STDC_VERSION, "built-in"); defdefine("__LINE__", NULL, "built-in"); defdefine("__FILE__", NULL, "built-in"); symline = lookup(NS_CPP, "__LINE__", ALLOC); symfile = lookup(NS_CPP, "__FILE__", ALLOC); for (bp = list; *bp; ++bp) defdefine(*bp, "1", "built-in"); ncmdlines = 0; } static void nextcpp(struct macroctx *mp) { next(); if (yytoken == EOFTOK) error("unterminated argument list invoking macro \"%s\"", mp->name); if (yylen + 1 > mp->arglen) error("argument overflow invoking macro \"%s\"", mp->name); if (yytoken == IDEN) yylval.sym->flags |= SUSED; memcpy(mp->argp, yytext, yylen); mp->argp += yylen; mp->arglen -= yylen + 1; *mp->argp++ = ' '; } static void paren(struct macroctx *mp) { for (;;) { nextcpp(mp); switch (yytoken) { case ')': return; case '(': paren(mp); break; } } } static void parameter(struct macroctx *mp) { for (;;) { nextcpp(mp); switch (yytoken) { case ')': case ',': /* remove " , " or " ) "*/ mp->argp -= 3; *mp->argp++ = '\0'; return; case '(': paren(mp); break; } } } static int parsepars(struct macroctx *mp) { int n; if (mp->npars == -1) return -1; if (ahead() != '(' && mp->npars > 0) return 0; next(); n = 0; if (ahead() == ')') { next(); } else { do { *mp->listp++ = mp->argp; parameter(mp); } while (++n < NR_MACROARG && yytoken == ','); } if (yytoken != ')') error("incorrect macro function-alike invocation"); disexpand = 0; if (n == NR_MACROARG) error("too many parameters in macro \"%s\"", mp->name); if (n != mp->npars) { error("macro \"%s\" received %d arguments, but it takes %d", mp->name, n, mp->npars); } return 1; } static size_t copymacro(struct macroctx *mp) { int delim, c, esc; char *s, *p, *arg, *bp; size_t size, bufsiz; bp = mp->buffer; bufsiz = mp->bufsiz; for (s = mp->def; c = *s; ++s) { switch (c) { case '\'': delim = '\''; goto search_delim; case '\"': delim = '"'; search_delim: esc = 0; p = s; for (++s; c = *s; ++s) { if (c == '\\' && !esc) esc = 1; else if (c == delim &&!esc) break; else esc = 0; } size = s - p + 1; if (size > bufsiz) goto expansion_too_long; memcpy(bp, p, size); bufsiz -= size; bp += size; break; case '$': /* token concatenation operator */ while (bp[-1] == ' ') --bp, ++bufsiz; while (s[1] == ' ') ++s; break; case '#': /* stringfier operator */ arg = mp->arglist[atoi(s += 2)]; s += 2; if (bufsiz < 3) goto expansion_too_long; *bp++ = '"'; while ((c = *arg++) != '\0') { if (c == '"') { if (bufsiz < 3) goto expansion_too_long; *bp++ = '\\'; *bp++ = '"'; bufsiz -= 2; } else { if (bufsiz < 2) goto expansion_too_long; *bp++ = c; bufsiz--; } } *bp++ = '"'; break; case '@': /* parameter substitution */ arg = mp->arglist[atoi(++s)]; s += 2; size = strlen(arg); if (size > bufsiz) goto expansion_too_long; memcpy(bp, arg, size); bp += size; bufsiz -= size; break; default: if (bufsiz-- == 0) goto expansion_too_long; *bp++ = c; break; } } *bp = '\0'; return bp - mp->buffer; expansion_too_long: error("macro expansion of \"%s\" too long", mp->name); } int expand(Symbol *sym) { size_t elen; int i; struct macroctx macro; char *arglist[NR_MACROARG]; char arguments[INPUTSIZ], buffer[INPUTSIZ]; DBG("MACRO '%s' detected %d %d", sym->name, disexpand, sym->hide); if (disexpand || sym->hide) return 0; macro.name = sym->name; macro.argp = arguments; macro.listp = arglist; macro.arglist = arglist; macro.arglen = INPUTSIZ; macro.buffer = buffer; macro.npars = atoi(sym->u.s); macro.def = sym->u.s + 3; macro.bufsiz = INPUTSIZ-1; if (sym == symfile) { elen = sprintf(buffer, "\"%s\" ", filenam); goto substitute; } if (sym == symline) { elen = sprintf(buffer, "%d ", lineno); goto substitute; } if (!sym->u.s) return 1; macro.npars = atoi(sym->u.s); if (!parsepars(¯o)) return 0; for (i = 0; i < macro.npars; ++i) DBG("MACRO par%d:%s", i, arglist[i]); elen = copymacro(¯o); substitute: buffer[elen] = '\0'; DBG("MACRO '%s' expanded to :'%s'", macro.name, buffer); addinput(filenam, sym, xstrdup(buffer), FAIL); return 1; } static int getpars(Symbol *args[NR_MACROARG]) { int n, c; Symbol *sym; c = *input->p; next(); if (c != '(') return -1; /* skip the '(' */ next(); if (accept(')')) return 0; n = 0; do { if (n == NR_MACROARG) { cpperror("too many parameters in macro"); return NR_MACROARG; } if (accept(ELLIPSIS)) { args[n++] = NULL; break; } if (yytoken != IDEN) { cpperror("macro arguments must be identifiers"); return NR_MACROARG; } sym = install(NS_IDEN, yylval.sym); sym->flags |= SUSED; args[n++] = sym; next(); } while (accept(',')); expect(')'); return n; } static int getdefs(Symbol *args[NR_MACROARG], int nargs, char *bp, size_t bufsiz) { Symbol **argp; size_t len; int prevc = 0, ispar; if (yytoken == '$') { cpperror("'##' cannot appear at either ends of a macro expansion"); return 0; } for (;;) { ispar = 0; if (yytoken == IDEN && nargs >= 0) { for (argp = args; argp < &args[nargs]; ++argp) { if (*argp == yylval.sym) break; } if (argp != &args[nargs]) { sprintf(yytext, "@%02d@", (int) (argp - args)); ispar = 1; } } if (prevc == '#' && !ispar) { cpperror("'#' is not followed by a macro parameter"); return 0; } if (yytoken == '\n') break; if ((len = strlen(yytext)) >= bufsiz) { cpperror("macro too long"); return 0; } /* $ token is generated by ## */ if (yytoken == '$') { *bp++ = '$'; --bufsiz; } else { memcpy(bp, yytext, len); bp += len; bufsiz -= len; } if ((prevc = yytoken) != '#') { *bp++ = ' '; --bufsiz; } next(); } *bp = '\0'; return 1; } static void define(void) { Symbol *sym,*args[NR_MACROARG]; char buff[LINESIZ+1]; int n; if (cppoff) return; disescape = 1; namespace = NS_CPP; next(); if (yytoken != IDEN) { cpperror("macro names must be identifiers"); return; } sym = yylval.sym; if (sym->flags & SDECLARED) { warn("'%s' redefined", yytext); free(sym->u.s); } else { sym = install(NS_CPP, sym); sym->flags |= SDECLARED|SSTRING; } namespace = NS_IDEN; /* Avoid polution in NS_CPP */ if ((n = getpars(args)) == NR_MACROARG) goto delete; if (n > 0 && !args[n-1]) /* it is a variadic function */ --n; sprintf(buff, "%02d#", n); if (!getdefs(args, n, buff+3, LINESIZ-3)) goto delete; sym->u.s = xstrdup(buff); DBG("MACRO '%s' defined as '%s'", sym->name, buff); return; delete: killsym(sym); } void incdir(char *dir) { if (!dir || *dir == '\0') die("cc1: incorrect -I flag"); newitem(&dirinclude, dir); } static int includefile(char *dir, char *file, size_t filelen) { size_t dirlen; char path[FILENAME_MAX]; if (!dir) { dirlen = 0; if (filelen > FILENAME_MAX-1) return 0; } else { dirlen = strlen(dir); if (dirlen + filelen > FILENAME_MAX-2) return 0; memcpy(path, dir, dirlen); if (dir[dirlen-1] != '/') path[dirlen++] = '/'; } memcpy(path+dirlen, file, filelen); path[dirlen + filelen] = '\0'; return addinput(path, NULL, NULL, NOFAIL); } static char * cwd(char *buf) { char *p, *s = filenam; size_t len; if ((p = strrchr(s, '/')) == NULL) return NULL; if ((len = p - s) >= FILENAME_MAX) die("cc1: current work directory too long"); memcpy(buf, s, len); buf[len] = '\0'; return buf; } static void include(void) { char dir[FILENAME_MAX], file[FILENAME_MAX], *p, **bp; size_t filelen; int n; if (cppoff) return; disexpand = 0; namespace = NS_IDEN; next(); switch (*yytext) { case '<': if ((p = strchr(input->begin, '>')) == NULL || p[-1] == '<') goto bad_include; filelen = p - input->begin; if (filelen >= FILENAME_MAX) goto too_long; memcpy(file, input->begin, filelen); file[filelen] = '\0'; input->begin = input->p = p+1; if (next() != '\n') goto trailing_characters; break; case '"': if (yylen < 3) goto bad_include; filelen = yylen-2; if (filelen >= FILENAME_MAX) goto too_long; memcpy(file, yytext+1, filelen); file[filelen] = '\0'; if (next() != '\n') goto trailing_characters; if (includefile(cwd(dir), file, filelen)) goto its_done; break; default: goto bad_include; } n = dirinclude.n; for (bp = dirinclude.s; n--; ++bp) { if (includefile(*bp, file, filelen)) goto its_done; } cpperror("included file '%s' not found", file); its_done: return; trailing_characters: cpperror("trailing characters after preprocessor directive"); return; too_long: cpperror("too long file name in #include"); return; bad_include: cpperror("#include expects \"FILENAME\" or <FILENAME>"); return; } static void line(void) { long n; char *endp, *fname; if (cppoff) return; disexpand = 0; next(); n = strtol(yytext, &endp, 10); if (n <= 0 || n > USHRT_MAX || *endp != '\0') { cpperror("first parameter of #line is not a positive integer"); return; } next(); if (yytoken == '\n') { fname = NULL; } else { if (*yytext != '\"' || yylen == 1) { cpperror("second parameter of #line is not a valid filename"); return; } fname = yylval.sym->u.s; } setloc(fname, n - 1); if (yytoken != '\n') next(); } static void pragma(void) { if (cppoff) return; next(); warn("ignoring pragma '%s'", yytext); *input->p = '\0'; next(); } static void usererr(void) { if (cppoff) return; cpperror("#error %s", input->p); *input->p = '\0'; next(); } static void ifclause(int negate, int isifdef) { Symbol *sym; unsigned n; int status; Node *expr; if (cppctx == NR_COND-1) error("too many nesting levels of conditional inclusion"); n = cppctx++; namespace = NS_CPP; next(); if (isifdef) { if (yytoken != IDEN) { cpperror("no macro name given in #%s directive", (negate) ? "ifndef" : "ifdef"); return; } sym = yylval.sym; next(); status = (sym->flags & SDECLARED) != 0; if (!status) killsym(sym); } else { /* TODO: catch recovery here */ if ((expr = constexpr()) == NULL) { cpperror("parameter of #if is not an integer constant expression"); return; } status = expr->sym->u.i != 0; freetree(expr); } if (negate) status = !status; if ((ifstatus[n] = status) == 0) ++cppoff; } static void cppif(void) { disexpand = 0; ifclause(0, 0); } static void ifdef(void) { ifclause(0, 1); } static void ifndef(void) { ifclause(1, 1); } static void elseclause(void) { int status; if (cppctx == 0) { cpperror("#else without #ifdef/ifndef"); return; } status = ifstatus[cppctx-1]; ifstatus[cppctx-1] = !status; cppoff += (status) ? 1 : -1; } static void cppelse(void) { elseclause(); next(); } static void elif(void) { elseclause(); if (ifstatus[cppctx-1]) { --cppctx; cppif(); } } static void endif(void) { if (cppctx == 0) error("#endif without #if"); if (!ifstatus[--cppctx]) --cppoff; next(); } static void undef(void) { if (cppoff) return; namespace = NS_CPP; next(); if (yytoken != IDEN) { error("no macro name given in #undef directive"); return; } killsym(yylval.sym); next(); } int cpp(void) { static struct { unsigned char token; void (*fun)(void); } *bp, clauses [] = { {DEFINE, define}, {INCLUDE, include}, {LINE, line}, {IFDEF, ifdef}, {IF, cppif}, {ELIF, elif}, {IFNDEF, ifndef}, {ELSE, cppelse}, {ENDIF, endif}, {UNDEF, undef}, {PRAGMA, pragma}, {ERROR, usererr}, {0, NULL} }; int ns; char *p; for (p = input->p; isspace(*p); ++p) ; if (*p != '#') return cppoff; input->p = p+1; disexpand = 1; lexmode = CPPMODE; ns = namespace; namespace = NS_CPPCLAUSES; next(); namespace = NS_IDEN; if (yytoken == '\n') goto ret; for (bp = clauses; bp->token && bp->token != yytoken; ++bp) ; if (!bp->token) { errorp("incorrect preprocessor directive '%s'", yytext); goto ret; } DBG("CPP %s", yytext); pushctx(); /* create a new context to avoid polish */ (*bp->fun)(); /* the current context, and to get all */ popctx(); /* the symbols freed at the end */ /* * #include changes the content of input->line, so the correctness * of the line must be checked in the own include(), and we have * to skip this tests. For the same reason include() is the only * function which does not prepare the next token */ if (yytoken != '\n' && !cppoff && bp->token != INCLUDE) errorp("trailing characters after preprocessor directive"); ret: disescape = 0; disexpand = 0; lexmode = CCMODE; namespace = ns; return 1; } void ppragmaln(void) { static char file[FILENAME_MAX]; static unsigned nline; char *s; putchar('\n'); if (strcmp(file, filenam)) { strcpy(file, filenam); s = "#line %u \"%s\"\n"; } else if (nline+1 != lineno) { s = "#line %u\n"; } else { s = ""; } nline = lineno; printf(s, nline, file); } void outcpp(void) { int c; char *s, *t; for (next(); yytoken != EOFTOK; next()) { if (onlyheader) continue; if (yytoken != STRING) { printf("%s ", yytext); continue; } for (s = yytext; (c = *s) != '\0'; ++s) { switch (c) { case '\n': t = "\\n"; goto print_str; case '\v': t = "\\v"; goto print_str; case '\b': t = "\\b"; goto print_str; case '\t': t = "\\t"; goto print_str; case '\a': t = "\\a"; goto print_str; case '\f': t = "\\f"; goto print_str; case '\r': t = "\\r"; goto print_str; case '"': if (s == yytext || s[1] == '\0') goto print_chr; t = "\\\""; goto print_str; case '\'': t = "\\'"; goto print_str; case '\?': t = "\\\?"; goto print_str; case '\\': putchar('\\'); default: print_chr: if (!isprint(c)) printf("\\x%x", c); else putchar(c); break; print_str: fputs(t, stdout); break; } } putchar(' '); } putchar('\n'); }