/* CPP main program, using CPP Library.
   Copyright (C) 1995, 1997, 1998, 1999, 2000, 2001 Free Software Foundation, Inc.
   Written by Per Bothner, 1994-95.

This program is free software; you can redistribute it and/or modify it
under the terms of the GNU General Public License as published by the
Free Software Foundation; either version 2, or (at your option) any
later version.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.

 In other words, you are welcome to use, share and improve this program.
 You are forbidden to forbid anyone else to use, share and improve
 what you give them.   Help stamp out software-hoarding!  */

#include "config.h"
#include "system.h"
#include "cpplib.h"
#include "intl.h"

/* Encapsulates state used to convert the stream of tokens coming from
   cpp_get_token back into a text file.  This file keeps exactly one
   instance of it, the file-scope variable `print'.  */
struct printer
{
  FILE *outf;                   /* Stream to write to; either stdout or
                                   the file opened by printer_init.  */
  const char *last_fname;       /* Previous file name: the one most
                                   recently recorded by cb_file_change
                                   and written into line markers by
                                   print_line.  */
  const char *syshdr_flags;     /* System header flags, if any: one of
                                   "", " 3" or " 3 4", chosen by
                                   cb_file_change.  */
  unsigned int lineno;          /* Line currently being written.  Zero
                                   until the first line of output has
                                   been positioned.  */
  unsigned char printed;        /* Nonzero if something output at
                                   lineno, i.e. the current output line
                                   still needs a terminating newline.  */
};

/* Program entry point and the top-level driver routines.  */
int main PARAMS ((int, char **));
static void general_init PARAMS ((const char *));
static void do_preprocessing PARAMS ((int, char **));
static void setup_callbacks PARAMS ((void));

/* General output routines. 
*/ static void scan_buffer PARAMS ((cpp_reader *)); static void check_multiline_token PARAMS ((cpp_string *)); static int printer_init PARAMS ((cpp_reader *)); static int dump_macro PARAMS ((cpp_reader *, cpp_hashnode *, void *)); static void print_line PARAMS ((const char *)); static void maybe_print_line PARAMS ((unsigned int)); /* Callback routines for the parser. Most of these are active only in specific modes. */ static void cb_define PARAMS ((cpp_reader *, cpp_hashnode *)); static void cb_undef PARAMS ((cpp_reader *, cpp_hashnode *)); static void cb_include PARAMS ((cpp_reader *, const unsigned char *, const cpp_token *)); static void cb_ident PARAMS ((cpp_reader *, const cpp_string *)); static void cb_file_change PARAMS ((cpp_reader *, const cpp_file_change *)); static void cb_def_pragma PARAMS ((cpp_reader *)); const char *progname; /* Needs to be global. */ static cpp_reader *pfile; /* An opaque handle. */ static cpp_options *options; /* Options of pfile. */ static struct printer print; int main (argc, argv) int argc; char **argv; { general_init (argv[0]); /* Contruct a reader with default language GNU C89. */ pfile = cpp_create_reader (CLK_GNUC89); options = cpp_get_options (pfile); do_preprocessing (argc, argv); /* Call to cpp_destroy () omitted for performance reasons. */ if (cpp_errors (pfile)) return FATAL_EXIT_CODE; return SUCCESS_EXIT_CODE; } /* Store the program name, and set the locale. */ static void general_init (argv0) const char *argv0; { progname = argv0 + strlen (argv0); while (progname != argv0 && ! IS_DIR_SEPARATOR (progname[-1])) --progname; xmalloc_set_program_name (progname); /* LC_CTYPE determines the character set used by the terminal so it has to be set to output messages correctly. */ #ifdef HAVE_LC_MESSAGES setlocale (LC_CTYPE, ""); setlocale (LC_MESSAGES, ""); #else setlocale (LC_ALL, ""); #endif (void) bindtextdomain (PACKAGE, localedir); (void) textdomain (PACKAGE); } /* Handle switches, preprocess and output. 
*/ static void do_preprocessing (argc, argv) int argc; char **argv; { int argi = 1; /* Next argument to handle. */ argi += cpp_handle_options (pfile, argc - argi , argv + argi); if (CPP_FATAL_ERRORS (pfile)) return; if (argi < argc) cpp_fatal (pfile, "Invalid option %s", argv[argi]); else cpp_post_options (pfile); if (CPP_FATAL_ERRORS (pfile)) return; /* If cpp_handle_options saw --help or --version on the command line, it will have set pfile->help_only to indicate this. Exit successfully. [The library does not exit itself, because e.g. cc1 needs to print its own --help message at this point.] */ if (options->help_only) return; /* Open the output now. We must do so even if no_output is on, because there may be other output than from the actual preprocessing (e.g. from -dM). */ if (printer_init (pfile)) return; setup_callbacks (); if (cpp_start_read (pfile, options->in_fname)) { /* A successful cpp_start_read guarantees that we can call cpp_scan_buffer_nooutput or cpp_get_token next. */ if (options->no_output) cpp_scan_buffer_nooutput (pfile, 1); else scan_buffer (pfile); /* -dM command line option. Should this be in cpp_finish? */ if (options->dump_macros == dump_only) cpp_forall_identifiers (pfile, dump_macro, NULL); cpp_finish (pfile); } /* Flush any pending output. */ if (print.printed) putc ('\n', print.outf); if (ferror (print.outf) || fclose (print.outf)) cpp_notice_from_errno (pfile, options->out_fname); } /* Set up the callbacks as appropriate. */ static void setup_callbacks () { cpp_callbacks *cb = cpp_get_callbacks (pfile); if (! options->no_output) { cb->ident = cb_ident; cb->def_pragma = cb_def_pragma; if (! options->no_line_commands) cb->file_change = cb_file_change; } if (options->dump_includes) cb->include = cb_include; if (options->dump_macros == dump_names || options->dump_macros == dump_definitions) { cb->define = cb_define; cb->undef = cb_undef; cb->poison = cb_def_pragma; } } /* Writes out the preprocessed file. 
Alternates between two tokens, so that we can avoid accidental token pasting. */ static void scan_buffer (pfile) cpp_reader *pfile; { unsigned int index, line; cpp_token tokens[2], *token; do { for (index = 0;; index = 1 - index) { token = &tokens[index]; cpp_get_token (pfile, token); if (token->type == CPP_EOF) break; line = cpp_get_line (pfile)->output_line; if (print.lineno != line) { unsigned int col = cpp_get_line (pfile)->col; /* Supply enough whitespace to put this token in its original column. Don't bother trying to reconstruct tabs; we can't get it right in general, and nothing ought to care. (Yes, some things do care; the fault lies with them.) */ maybe_print_line (line); if (col > 1) { if (token->flags & PREV_WHITE) col--; while (--col) putc (' ', print.outf); } } else if ((token->flags & (PREV_WHITE | AVOID_LPASTE)) == AVOID_LPASTE && cpp_avoid_paste (pfile, &tokens[1 - index], token)) token->flags |= PREV_WHITE; /* Special case '# ': insert a space between the # and the token. This will prevent it from being treated as a directive when this code is re-preprocessed. XXX Should do this only at the beginning of a line, but how? */ else if (token->type == CPP_NAME && token->val.node->directive_index && tokens[1 - index].type == CPP_HASH) token->flags |= PREV_WHITE; cpp_output_token (token, print.outf); print.printed = 1; if (token->type == CPP_STRING || token->type == CPP_WSTRING || token->type == CPP_COMMENT) check_multiline_token (&token->val.str); } } while (cpp_pop_buffer (pfile) != 0); } /* Adjust print.lineno for newlines embedded in tokens. */ static void check_multiline_token (str) cpp_string *str; { unsigned int i; for (i = 0; i < str->len; i++) if (str->text[i] == '\n') print.lineno++; } /* Initialize a cpp_printer structure. As a side effect, open the output file. 
*/ static int printer_init (pfile) cpp_reader *pfile; { print.last_fname = 0; print.lineno = 0; print.printed = 0; if (options->out_fname[0] == '\0') print.outf = stdout; else { print.outf = fopen (options->out_fname, "w"); if (! print.outf) { cpp_notice_from_errno (pfile, options->out_fname); return 1; } } return 0; } /* Newline-terminate any output line currently in progress. If appropriate, write the current line number to the output, or pad with newlines so the output line matches the current line. */ static void maybe_print_line (line) unsigned int line; { /* End the previous line of text (probably only needed until we get multi-line tokens fixed). */ if (print.printed) { putc ('\n', print.outf); print.lineno++; print.printed = 0; } if (options->no_line_commands) { print.lineno = line; return; } /* print.lineno is zero if this is the first token of the file. We handle this specially, so that a first line of "# 1 "foo.c" in file foo.i outputs just the foo.c line, and not a foo.i line. */ if (line >= print.lineno && line < print.lineno + 8 && print.lineno) { while (line > print.lineno) { putc ('\n', print.outf); print.lineno++; } } else { print.lineno = line; print_line (""); } } static void print_line (special_flags) const char *special_flags; { /* End any previous line of text. */ if (print.printed) putc ('\n', print.outf); print.printed = 0; fprintf (print.outf, "# %u \"%s\"%s%s\n", print.lineno, print.last_fname, special_flags, print.syshdr_flags); } /* Callbacks. */ static void cb_ident (pfile, str) cpp_reader *pfile ATTRIBUTE_UNUSED; const cpp_string * str; { maybe_print_line (cpp_get_line (pfile)->output_line); fprintf (print.outf, "#ident \"%s\"\n", str->text); print.lineno++; } static void cb_define (pfile, node) cpp_reader *pfile; cpp_hashnode *node; { maybe_print_line (cpp_get_line (pfile)->output_line); fprintf (print.outf, "#define %s", NODE_NAME (node)); /* -dD command line option. 
*/ if (options->dump_macros == dump_definitions) fputs ((const char *) cpp_macro_definition (pfile, node), print.outf); putc ('\n', print.outf); print.lineno++; } static void cb_undef (pfile, node) cpp_reader *pfile; cpp_hashnode *node; { maybe_print_line (cpp_get_line (pfile)->output_line); fprintf (print.outf, "#undef %s\n", NODE_NAME (node)); print.lineno++; } static void cb_include (pfile, dir, header) cpp_reader *pfile ATTRIBUTE_UNUSED; const unsigned char *dir; const cpp_token *header; { maybe_print_line (cpp_get_line (pfile)->output_line); fprintf (print.outf, "#%s %s\n", dir, cpp_token_as_text (pfile, header)); print.lineno++; } static void cb_file_change (pfile, fc) cpp_reader *pfile ATTRIBUTE_UNUSED; const cpp_file_change *fc; { /* Bring current file to correct line (except first file). */ if (fc->reason == FC_ENTER && fc->from.filename) maybe_print_line (fc->from.lineno); print.last_fname = fc->to.filename; if (fc->externc) print.syshdr_flags = " 3 4"; else if (fc->sysp) print.syshdr_flags = " 3"; else print.syshdr_flags = ""; if (print.lineno) { const char *flags = ""; print.lineno = fc->to.lineno; if (fc->reason == FC_ENTER) flags = " 1"; else if (fc->reason == FC_LEAVE) flags = " 2"; if (! options->no_line_commands) print_line (flags); } } static void cb_def_pragma (pfile) cpp_reader *pfile; { maybe_print_line (cpp_get_line (pfile)->output_line); fputs ("#pragma ", print.outf); cpp_output_line (pfile, print.outf); print.lineno++; } /* Dump out the hash table. */ static int dump_macro (pfile, node, v) cpp_reader *pfile; cpp_hashnode *node; void *v ATTRIBUTE_UNUSED; { if (node->type == NT_MACRO && !(node->flags & NODE_BUILTIN)) { fprintf (print.outf, "#define %s", NODE_NAME (node)); fputs ((const char *) cpp_macro_definition (pfile, node), print.outf); putc ('\n', print.outf); print.lineno++; } return 1; }