/* The Netwide Assembler main program module * * The Netwide Assembler is copyright (C) 1996 Simon Tatham and * Julian Hall. All rights reserved. The software is * redistributable under the licence given in the file "Licence" * distributed in the NASM archive. */ #include "compiler.h" #include #include #include #include #include #include #include #include "nasm.h" #include "nasmlib.h" #include "float.h" #include "stdscan.h" #include "insns.h" #include "preproc.h" #include "parser.h" #include "eval.h" #include "assemble.h" #include "labels.h" #include "outform.h" #include "listing.h" struct forwrefinfo { /* info held on forward refs. */ int lineno; int operand; }; static int get_bits(char *value); static uint32_t get_cpu(char *cpu_str); static void parse_cmdline(int, char **); static void assemble_file(char *); static void register_output_formats(void); static void report_error_gnu(int severity, const char *fmt, ...); static void report_error_vc(int severity, const char *fmt, ...); static void report_error_common(int severity, const char *fmt, va_list args); static int is_suppressed_warning(int severity); static void usage(void); static efunc report_error; static int using_debug_info, opt_verbose_info; bool tasm_compatible_mode = false; int pass0; int maxbits = 0; int globalrel = 0; static char inname[FILENAME_MAX]; static char outname[FILENAME_MAX]; static char listname[FILENAME_MAX]; static char errname[FILENAME_MAX]; static int globallineno; /* for forward-reference tracking */ /* static int pass = 0; */ static struct ofmt *ofmt = NULL; static FILE *error_file; /* Where to write error messages */ static FILE *ofile = NULL; int optimizing = -1; /* number of optimization passes to take */ static int sb, cmd_sb = 16; /* by default */ static uint32_t cmd_cpu = IF_PLEVEL; /* highest level by default */ static uint32_t cpu = IF_PLEVEL; /* passed to insn_size & assemble.c */ bool global_offset_changed; /* referenced in labels.c */ static struct location location; int in_abs_seg; /* Flag we are in ABSOLUTE seg */ int32_t abs_seg; /* ABSOLUTE segment basis */ int32_t abs_offset; /* ABSOLUTE offset */ static struct RAA *offsets; static struct SAA *forwrefs; /* keep track of forward references */ static const struct forwrefinfo *forwref; static Preproc *preproc; enum op_type { op_normal, /* Preprocess and assemble */ op_preprocess, /* Preprocess only */ op_depend, /* Generate dependencies */ op_depend_missing_ok, /* Generate dependencies, missing OK */ }; static enum op_type operating_mode; /* * Which of the suppressible warnings are suppressed. Entry zero * isn't an actual warning, but it used for -w+error/-Werror. */ static bool suppressed[ERR_WARN_MAX+1] = { true, false, true, false, false, true, false, true, true, false }; /* * The option names for the suppressible warnings. As before, entry * zero does nothing. */ static const char *suppressed_names[ERR_WARN_MAX+1] = { "error", "macro-params", "macro-selfref", "orphan-labels", "number-overflow", "gnu-elf-extensions", "float-overflow", "float-denorm", "float-underflow", "float-toolong" }; /* * The explanations for the suppressible warnings. As before, entry * zero does nothing. */ static const char *suppressed_what[ERR_WARN_MAX+1] = { "treat warnings as errors", "macro calls with wrong parameter count", "cyclic macro references", "labels alone on lines without trailing `:'", "numeric constants does not fit in 64 bits", "using 8- or 16-bit relocation in ELF32, a GNU extension", "floating point overflow", "floating point denormal", "floating point underflow", "too many digits in floating-point number" }; /* * This is a null preprocessor which just copies lines from input * to output. It's used when someone explicitly requests that NASM * not preprocess their source file. */ static void no_pp_reset(char *, int, efunc, evalfunc, ListGen *); static char *no_pp_getline(void); static void no_pp_cleanup(int); static Preproc no_pp = { no_pp_reset, no_pp_getline, no_pp_cleanup }; /* * get/set current offset... */ #define GET_CURR_OFFS (in_abs_seg?abs_offset:\ raa_read(offsets,location.segment)) #define SET_CURR_OFFS(x) (in_abs_seg?(void)(abs_offset=(x)):\ (void)(offsets=raa_write(offsets,location.segment,(x)))) static int want_usage; static int terminate_after_phase; int user_nolist = 0; /* fbk 9/2/00 */ static void nasm_fputs(const char *line, FILE * outfile) { if (outfile) { fputs(line, outfile); putc('\n', outfile); } else puts(line); } int main(int argc, char **argv) { pass0 = 1; want_usage = terminate_after_phase = false; report_error = report_error_gnu; error_file = stderr; nasm_set_malloc_error(report_error); offsets = raa_init(); forwrefs = saa_init((int32_t)sizeof(struct forwrefinfo)); preproc = &nasmpp; operating_mode = op_normal; seg_init(); register_output_formats(); parse_cmdline(argc, argv); if (terminate_after_phase) { if (want_usage) usage(); return 1; } /* If debugging info is disabled, suppress any debug calls */ if (!using_debug_info) ofmt->current_dfmt = &null_debug_form; if (ofmt->stdmac) pp_extra_stdmac(ofmt->stdmac); parser_global_info(ofmt, &location); eval_global_info(ofmt, lookup_label, &location); /* define some macros dependent of command-line */ { char temp[64]; snprintf(temp, sizeof(temp), "__OUTPUT_FORMAT__=%s\n", ofmt->shortname); pp_pre_define(temp); } switch (operating_mode) { case op_depend_missing_ok: pp_include_path(NULL); /* "assume generated" */ /* fall through */ case op_depend: { char *line; preproc->reset(inname, 0, report_error, evaluate, &nasmlist); if (outname[0] == '\0') ofmt->filename(inname, outname, report_error); ofile = NULL; fprintf(stdout, "%s: %s", outname, inname); while ((line = preproc->getline())) nasm_free(line); preproc->cleanup(0); putc('\n', stdout); } break; case op_preprocess: { char *line; char *file_name = NULL; int32_t prior_linnum = 0; int lineinc = 0; if (*outname) { ofile = fopen(outname, "w"); if (!ofile) report_error(ERR_FATAL | ERR_NOFILE, "unable to open output file `%s'", outname); } else ofile = NULL; location.known = false; /* pass = 1; */ preproc->reset(inname, 2, report_error, evaluate, &nasmlist); while ((line = preproc->getline())) { /* * We generate %line directives if needed for later programs */ int32_t linnum = prior_linnum += lineinc; int altline = src_get(&linnum, &file_name); if (altline) { if (altline == 1 && lineinc == 1) nasm_fputs("", ofile); else { lineinc = (altline != -1 || lineinc != 1); fprintf(ofile ? ofile : stdout, "%%line %"PRId32"+%d %s\n", linnum, lineinc, file_name); } prior_linnum = linnum; } nasm_fputs(line, ofile); nasm_free(line); } nasm_free(file_name); preproc->cleanup(0); if (ofile) fclose(ofile); if (ofile && terminate_after_phase) remove(outname); } break; case op_normal: { /* * We must call ofmt->filename _anyway_, even if the user * has specified their own output file, because some * formats (eg OBJ and COFF) use ofmt->filename to find out * the name of the input file and then put that inside the * file. */ ofmt->filename(inname, outname, report_error); ofile = fopen(outname, "wb"); if (!ofile) { report_error(ERR_FATAL | ERR_NOFILE, "unable to open output file `%s'", outname); } /* * We must call init_labels() before ofmt->init() since * some object formats will want to define labels in their * init routines. (eg OS/2 defines the FLAT group) */ init_labels(); ofmt->init(ofile, report_error, define_label, evaluate); assemble_file(inname); if (!terminate_after_phase) { ofmt->cleanup(using_debug_info); cleanup_labels(); } else { /* * We had an fclose on the output file here, but we * actually do that in all the object file drivers as well, * so we're leaving out the one here. * fclose (ofile); */ remove(outname); if (listname[0]) remove(listname); } } break; } if (want_usage) usage(); raa_free(offsets); saa_free(forwrefs); eval_cleanup(); stdscan_cleanup(); if (terminate_after_phase) return 1; else return 0; } /* * Get a parameter for a command line option. * First arg must be in the form of e.g. -f... */ static char *get_param(char *p, char *q, bool *advance) { *advance = false; if (p[2]) { /* the parameter's in the option */ p += 2; while (isspace(*p)) p++; return p; } if (q && q[0]) { *advance = true; return q; } report_error(ERR_NONFATAL | ERR_NOFILE | ERR_USAGE, "option `-%c' requires an argument", p[1]); return NULL; } /* * Copy a filename */ static void copy_filename(char *dst, const char *src) { size_t len = strlen(src); if (len >= (size_t)FILENAME_MAX) { report_error(ERR_FATAL | ERR_NOFILE, "file name too long"); return; } strncpy(dst, src, FILENAME_MAX); } struct textargs { const char *label; int value; }; #define OPT_PREFIX 0 #define OPT_POSTFIX 1 struct textargs textopts[] = { {"prefix", OPT_PREFIX}, {"postfix", OPT_POSTFIX}, {NULL, 0} }; static bool stopoptions = false; static bool process_arg(char *p, char *q) { char *param; int i; bool advance = false; bool suppress; if (!p || !p[0]) return false; if (p[0] == '-' && !stopoptions) { if (strchr("oOfpPdDiIlFXuUZwW", p[1])) { /* These parameters take values */ if (!(param = get_param(p, q, &advance))) return advance; } switch (p[1]) { case 's': error_file = stdout; break; case 'o': /* output file */ copy_filename(outname, param); break; case 'f': /* output format */ ofmt = ofmt_find(param); if (!ofmt) { report_error(ERR_FATAL | ERR_NOFILE | ERR_USAGE, "unrecognised output format `%s' - " "use -hf for a list", param); } else { ofmt->current_dfmt = ofmt->debug_formats[0]; } break; case 'O': /* Optimization level */ { int opt; if (!*param) { /* Naked -O == -Ox */ optimizing = INT_MAX >> 1; /* Almost unlimited */ } else { while (*param) { switch (*param) { case '0': case '1': case '2': case '3': case '4': case '5': case '6': case '7': case '8': case '9': opt = strtoul(param, ¶m, 10); /* -O0 -> optimizing == -1, 0.98 behaviour */ /* -O1 -> optimizing == 0, 0.98.09 behaviour */ if (opt < 2) optimizing = opt - 1; else if (opt <= 5) /* The optimizer seems to have problems with < 5 passes? Hidden bug? */ optimizing = 5; /* 5 passes */ else optimizing = opt; /* More than 5 passes */ break; case 'v': case '+': param++; opt_verbose_info = true; break; case 'x': param++; optimizing = INT_MAX >> 1; /* Almost unlimited */ break; default: report_error(ERR_FATAL, "unknown optimization option -O%c\n", *param); break; } } } break; } case 'p': /* pre-include */ case 'P': pp_pre_include(param); break; case 'd': /* pre-define */ case 'D': pp_pre_define(param); break; case 'u': /* un-define */ case 'U': pp_pre_undefine(param); break; case 'i': /* include search path */ case 'I': pp_include_path(param); break; case 'l': /* listing file */ copy_filename(listname, param); break; case 'Z': /* error messages file */ strcpy(errname, param); break; case 'F': /* specify debug format */ ofmt->current_dfmt = dfmt_find(ofmt, param); if (!ofmt->current_dfmt) { report_error(ERR_FATAL | ERR_NOFILE | ERR_USAGE, "unrecognized debug format `%s' for" " output format `%s'", param, ofmt->shortname); } break; case 'X': /* specify error reporting format */ if (nasm_stricmp("vc", param) == 0) report_error = report_error_vc; else if (nasm_stricmp("gnu", param) == 0) report_error = report_error_gnu; else report_error(ERR_FATAL | ERR_NOFILE | ERR_USAGE, "unrecognized error reporting format `%s'", param); break; case 'g': using_debug_info = true; break; case 'h': printf ("usage: nasm [-@ response file] [-o outfile] [-f format] " "[-l listfile]\n" " [options...] [--] filename\n" " or nasm -v for version info\n\n" " -t assemble in SciTech TASM compatible mode\n" " -g generate debug information in selected format.\n"); printf (" -E (or -e) preprocess only (writes output to stdout by default)\n" " -a don't preprocess (assemble only)\n" " -M generate Makefile dependencies on stdout\n" " -MG d:o, missing files assumed generated\n\n" " -Z redirect error messages to file\n" " -s redirect error messages to stdout\n\n" " -F format select a debugging format\n\n" " -I adds a pathname to the include file path\n"); printf (" -O optimize branch offsets (-O0 disables, default)\n" " -P pre-includes a file\n" " -D[=] pre-defines a macro\n" " -U undefines a macro\n" " -X specifies error reporting format (gnu or vc)\n" " -w+foo enables warning foo (equiv. -Wfoo)\n" " -w-foo disable warning foo (equiv. -Wno-foo)\n" "Warnings:\n"); for (i = 0; i <= ERR_WARN_MAX; i++) printf(" %-23s %s (default %s)\n", suppressed_names[i], suppressed_what[i], suppressed[i] ? "off" : "on"); printf ("\nresponse files should contain command line parameters" ", one per line.\n"); if (p[2] == 'f') { printf("\nvalid output formats for -f are" " (`*' denotes default):\n"); ofmt_list(ofmt, stdout); } else { printf("\nFor a list of valid output formats, use -hf.\n"); printf("For a list of debug formats, use -f
-y.\n"); } exit(0); /* never need usage message here */ break; case 'y': printf("\nvalid debug formats for '%s' output format are" " ('*' denotes default):\n", ofmt->shortname); dfmt_list(ofmt, stdout); exit(0); break; case 't': tasm_compatible_mode = true; break; case 'v': { const char *nasm_version_string = "NASM version " NASM_VER " compiled on " __DATE__ #ifdef DEBUG " with -DDEBUG" #endif ; puts(nasm_version_string); exit(0); /* never need usage message here */ } break; case 'e': /* preprocess only */ case 'E': operating_mode = op_preprocess; break; case 'a': /* assemble only - don't preprocess */ preproc = &no_pp; break; case 'W': if (param[0] == 'n' && param[1] == 'o' && param[2] == '-') { suppress = true; param += 3; } else { suppress = false; } goto set_warning; case 'w': if (param[0] != '+' && param[0] != '-') { report_error(ERR_NONFATAL | ERR_NOFILE | ERR_USAGE, "invalid option to `-w'"); break; } suppress = (param[0] == '-'); param++; goto set_warning; set_warning: for (i = 0; i <= ERR_WARN_MAX; i++) if (!nasm_stricmp(param, suppressed_names[i])) break; if (i <= ERR_WARN_MAX) suppressed[i] = suppress; else if (!nasm_stricmp(param, "all")) for (i = 1; i <= ERR_WARN_MAX; i++) suppressed[i] = suppress; else if (!nasm_stricmp(param, "none")) for (i = 1; i <= ERR_WARN_MAX; i++) suppressed[i] = !suppress; else report_error(ERR_NONFATAL | ERR_NOFILE | ERR_USAGE, "invalid warning `%s'", param); break; case 'M': operating_mode = p[2] == 'G' ? op_depend_missing_ok : op_depend; break; case '-': { int s; if (p[2] == 0) { /* -- => stop processing options */ stopoptions = 1; break; } for (s = 0; textopts[s].label; s++) { if (!nasm_stricmp(p + 2, textopts[s].label)) { break; } } switch (s) { case OPT_PREFIX: case OPT_POSTFIX: { if (!q) { report_error(ERR_NONFATAL | ERR_NOFILE | ERR_USAGE, "option `--%s' requires an argument", p + 2); break; } else { advance = 1, param = q; } if (s == OPT_PREFIX) { strncpy(lprefix, param, PREFIX_MAX - 1); lprefix[PREFIX_MAX - 1] = 0; break; } if (s == OPT_POSTFIX) { strncpy(lpostfix, param, POSTFIX_MAX - 1); lpostfix[POSTFIX_MAX - 1] = 0; break; } break; } default: { report_error(ERR_NONFATAL | ERR_NOFILE | ERR_USAGE, "unrecognised option `--%s'", p + 2); break; } } break; } default: if (!ofmt->setinfo(GI_SWITCH, &p)) report_error(ERR_NONFATAL | ERR_NOFILE | ERR_USAGE, "unrecognised option `-%c'", p[1]); break; } } else { if (*inname) { report_error(ERR_NONFATAL | ERR_NOFILE | ERR_USAGE, "more than one input file specified"); } else { copy_filename(inname, p); } } return advance; } #define ARG_BUF_DELTA 128 static void process_respfile(FILE * rfile) { char *buffer, *p, *q, *prevarg; int bufsize, prevargsize; bufsize = prevargsize = ARG_BUF_DELTA; buffer = nasm_malloc(ARG_BUF_DELTA); prevarg = nasm_malloc(ARG_BUF_DELTA); prevarg[0] = '\0'; while (1) { /* Loop to handle all lines in file */ p = buffer; while (1) { /* Loop to handle long lines */ q = fgets(p, bufsize - (p - buffer), rfile); if (!q) break; p += strlen(p); if (p > buffer && p[-1] == '\n') break; if (p - buffer > bufsize - 10) { int offset; offset = p - buffer; bufsize += ARG_BUF_DELTA; buffer = nasm_realloc(buffer, bufsize); p = buffer + offset; } } if (!q && p == buffer) { if (prevarg[0]) process_arg(prevarg, NULL); nasm_free(buffer); nasm_free(prevarg); return; } /* * Play safe: remove CRs, LFs and any spurious ^Zs, if any of * them are present at the end of the line. */ *(p = &buffer[strcspn(buffer, "\r\n\032")]) = '\0'; while (p > buffer && isspace(p[-1])) *--p = '\0'; p = buffer; while (isspace(*p)) p++; if (process_arg(prevarg, p)) *p = '\0'; if ((int) strlen(p) > prevargsize - 10) { prevargsize += ARG_BUF_DELTA; prevarg = nasm_realloc(prevarg, prevargsize); } strncpy(prevarg, p, prevargsize); } } /* Function to process args from a string of args, rather than the * argv array. Used by the environment variable and response file * processing. */ static void process_args(char *args) { char *p, *q, *arg, *prevarg; char separator = ' '; p = args; if (*p && *p != '-') separator = *p++; arg = NULL; while (*p) { q = p; while (*p && *p != separator) p++; while (*p == separator) *p++ = '\0'; prevarg = arg; arg = q; if (process_arg(prevarg, arg)) arg = NULL; } if (arg) process_arg(arg, NULL); } static void parse_cmdline(int argc, char **argv) { FILE *rfile; char *envreal, *envcopy = NULL, *p, *arg; *inname = *outname = *listname = *errname = '\0'; /* * First, process the NASMENV environment variable. */ envreal = getenv("NASMENV"); arg = NULL; if (envreal) { envcopy = nasm_strdup(envreal); process_args(envcopy); nasm_free(envcopy); } /* * Now process the actual command line. */ while (--argc) { bool advance; argv++; if (argv[0][0] == '@') { /* We have a response file, so process this as a set of * arguments like the environment variable. This allows us * to have multiple arguments on a single line, which is * different to the -@resp file processing below for regular * NASM. */ char *str = malloc(2048); FILE *f = fopen(&argv[0][1], "r"); if (!str) { printf("out of memory"); exit(-1); } if (f) { while (fgets(str, 2048, f)) { process_args(str); } fclose(f); } free(str); argc--; argv++; } if (!stopoptions && argv[0][0] == '-' && argv[0][1] == '@') { p = get_param(argv[0], argc > 1 ? argv[1] : NULL, &advance); if (p) { rfile = fopen(p, "r"); if (rfile) { process_respfile(rfile); fclose(rfile); } else report_error(ERR_NONFATAL | ERR_NOFILE | ERR_USAGE, "unable to open response file `%s'", p); } } else advance = process_arg(argv[0], argc > 1 ? argv[1] : NULL); argv += advance, argc -= advance; } /* Look for basic command line typos. This definitely doesn't catch all errors, but it might help cases of fumbled fingers. */ if (!*inname) report_error(ERR_NONFATAL | ERR_NOFILE | ERR_USAGE, "no input file specified"); else if (!strcmp(inname, errname) || !strcmp(inname, outname) || !strcmp(inname, listname)) report_error(ERR_FATAL | ERR_NOFILE | ERR_USAGE, "file `%s' is both input and output file", inname); if (*errname) { error_file = fopen(errname, "w"); if (!error_file) { error_file = stderr; /* Revert to default! */ report_error(ERR_FATAL | ERR_NOFILE | ERR_USAGE, "cannot open file `%s' for error messages", errname); } } } /* List of directives */ enum directives { D_NONE, D_ABSOLUTE, D_BITS, D_COMMON, D_CPU, D_DEBUG, D_DEFAULT, D_EXTERN, D_FLOAT, D_GLOBAL, D_LIST, D_SECTION, D_SEGMENT, D_WARNING }; static const char *directives[] = { "", "absolute", "bits", "common", "cpu", "debug", "default", "extern", "float", "global", "list", "section", "segment", "warning" }; static enum directives getkw(char **directive, char **value); static void assemble_file(char *fname) { char *directive, *value, *p, *q, *special, *line, debugid[80]; insn output_ins; int i, validid; bool rn_error; int32_t seg; int64_t offs; struct tokenval tokval; expr *e; int pass, pass_max; int pass_cnt = 0; /* count actual passes */ if (cmd_sb == 32 && cmd_cpu < IF_386) report_error(ERR_FATAL, "command line: " "32-bit segment size requires a higher cpu"); pass_max = (optimizing > 0 ? optimizing : 0) + 2; /* passes 1, optimizing, then 2 */ pass0 = !(optimizing > 0); /* start at 1 if not optimizing */ for (pass = 1; pass <= pass_max && pass0 <= 2; pass++) { int pass1, pass2; ldfunc def_label; pass1 = pass < pass_max ? 1 : 2; /* seq is 1, 1, 1,..., 1, 2 */ pass2 = pass > 1 ? 2 : 1; /* seq is 1, 2, 2,..., 2, 2 */ /* pass0 seq is 0, 0, 0,..., 1, 2 */ def_label = pass > 1 ? redefine_label : define_label; globalbits = sb = cmd_sb; /* set 'bits' to command line default */ cpu = cmd_cpu; if (pass0 == 2) { if (*listname) nasmlist.init(listname, report_error); } in_abs_seg = false; global_offset_changed = false; /* set by redefine_label */ location.segment = ofmt->section(NULL, pass2, &sb); globalbits = sb; if (pass > 1) { saa_rewind(forwrefs); forwref = saa_rstruct(forwrefs); raa_free(offsets); offsets = raa_init(); } preproc->reset(fname, pass1, report_error, evaluate, &nasmlist); globallineno = 0; if (pass == 1) location.known = true; location.offset = offs = GET_CURR_OFFS; while ((line = preproc->getline())) { enum directives d; globallineno++; /* here we parse our directives; this is not handled by the 'real' * parser. */ directive = line; d = getkw(&directive, &value); if (d) { int err = 0; switch (d) { case D_SEGMENT: /* [SEGMENT n] */ case D_SECTION: seg = ofmt->section(value, pass2, &sb); if (seg == NO_SEG) { report_error(pass1 == 1 ? ERR_NONFATAL : ERR_PANIC, "segment name `%s' not recognized", value); } else { in_abs_seg = false; location.segment = seg; } break; case D_EXTERN: /* [EXTERN label:special] */ if (*value == '$') value++; /* skip initial $ if present */ if (pass0 == 2) { q = value; while (*q && *q != ':') q++; if (*q == ':') { *q++ = '\0'; ofmt->symdef(value, 0L, 0L, 3, q); } } else if (pass == 1) { /* pass == 1 */ q = value; validid = true; if (!isidstart(*q)) validid = false; while (*q && *q != ':') { if (!isidchar(*q)) validid = false; q++; } if (!validid) { report_error(ERR_NONFATAL, "identifier expected after EXTERN"); break; } if (*q == ':') { *q++ = '\0'; special = q; } else special = NULL; if (!is_extern(value)) { /* allow re-EXTERN to be ignored */ int temp = pass0; pass0 = 1; /* fake pass 1 in labels.c */ declare_as_global(value, special, report_error); define_label(value, seg_alloc(), 0L, NULL, false, true, ofmt, report_error); pass0 = temp; } } /* else pass0 == 1 */ break; case D_BITS: /* [BITS bits] */ globalbits = sb = get_bits(value); break; case D_GLOBAL: /* [GLOBAL symbol:special] */ if (*value == '$') value++; /* skip initial $ if present */ if (pass0 == 2) { /* pass 2 */ q = value; while (*q && *q != ':') q++; if (*q == ':') { *q++ = '\0'; ofmt->symdef(value, 0L, 0L, 3, q); } } else if (pass2 == 1) { /* pass == 1 */ q = value; validid = true; if (!isidstart(*q)) validid = false; while (*q && *q != ':') { if (!isidchar(*q)) validid = false; q++; } if (!validid) { report_error(ERR_NONFATAL, "identifier expected after GLOBAL"); break; } if (*q == ':') { *q++ = '\0'; special = q; } else special = NULL; declare_as_global(value, special, report_error); } /* pass == 1 */ break; case D_COMMON: /* [COMMON symbol size:special] */ if (*value == '$') value++; /* skip initial $ if present */ if (pass0 == 1) { p = value; validid = true; if (!isidstart(*p)) validid = false; while (*p && !isspace(*p)) { if (!isidchar(*p)) validid = false; p++; } if (!validid) { report_error(ERR_NONFATAL, "identifier expected after COMMON"); break; } if (*p) { int64_t size; while (*p && isspace(*p)) *p++ = '\0'; q = p; while (*q && *q != ':') q++; if (*q == ':') { *q++ = '\0'; special = q; } else special = NULL; size = readnum(p, &rn_error); if (rn_error) report_error(ERR_NONFATAL, "invalid size specified" " in COMMON declaration"); else define_common(value, seg_alloc(), size, special, ofmt, report_error); } else report_error(ERR_NONFATAL, "no size specified in" " COMMON declaration"); } else if (pass0 == 2) { /* pass == 2 */ q = value; while (*q && *q != ':') { if (isspace(*q)) *q = '\0'; q++; } if (*q == ':') { *q++ = '\0'; ofmt->symdef(value, 0L, 0L, 3, q); } } break; case D_ABSOLUTE: /* [ABSOLUTE address] */ stdscan_reset(); stdscan_bufptr = value; tokval.t_type = TOKEN_INVALID; e = evaluate(stdscan, NULL, &tokval, NULL, pass2, report_error, NULL); if (e) { if (!is_reloc(e)) report_error(pass0 == 1 ? ERR_NONFATAL : ERR_PANIC, "cannot use non-relocatable expression as " "ABSOLUTE address"); else { abs_seg = reloc_seg(e); abs_offset = reloc_value(e); } } else if (pass == 1) abs_offset = 0x100; /* don't go near zero in case of / */ else report_error(ERR_PANIC, "invalid ABSOLUTE address " "in pass two"); in_abs_seg = true; location.segment = NO_SEG; break; case D_DEBUG: /* [DEBUG] */ p = value; q = debugid; validid = true; if (!isidstart(*p)) validid = false; while (*p && !isspace(*p)) { if (!isidchar(*p)) validid = false; *q++ = *p++; } *q++ = 0; if (!validid) { report_error(pass == 1 ? ERR_NONFATAL : ERR_PANIC, "identifier expected after DEBUG"); break; } while (*p && isspace(*p)) p++; if (pass == pass_max) ofmt->current_dfmt->debug_directive(debugid, p); break; case D_WARNING: /* [WARNING {+|-}warn-name] */ if (pass1 == 1) { while (*value && isspace(*value)) value++; if (*value == '+' || *value == '-') { validid = (*value == '-') ? true : false; value++; } else validid = false; for (i = 1; i <= ERR_WARN_MAX; i++) if (!nasm_stricmp(value, suppressed_names[i])) break; if (i <= ERR_WARN_MAX) suppressed[i] = validid; else report_error(ERR_NONFATAL, "invalid warning id in WARNING directive"); } break; case D_CPU: /* [CPU] */ cpu = get_cpu(value); break; case D_LIST: /* [LIST {+|-}] */ while (*value && isspace(*value)) value++; if (*value == '+') { user_nolist = 0; } else { if (*value == '-') { user_nolist = 1; } else { err = 1; } } break; case D_DEFAULT: /* [DEFAULT] */ stdscan_reset(); stdscan_bufptr = value; tokval.t_type = TOKEN_INVALID; if (stdscan(NULL, &tokval) == TOKEN_SPECIAL) { switch ((int)tokval.t_integer) { case S_REL: globalrel = 1; break; case S_ABS: globalrel = 0; break; default: err = 1; break; } } else { err = 1; } break; case D_FLOAT: if (float_option(value)) { report_error(pass1 == 1 ? ERR_NONFATAL : ERR_PANIC, "unknown 'float' directive: %s", value); } break; default: if (!ofmt->directive(directive, value, pass2)) report_error(pass1 == 1 ? ERR_NONFATAL : ERR_PANIC, "unrecognised directive [%s]", directive); } if (err) { report_error(ERR_NONFATAL, "invalid parameter to [%s] directive", directive); } } else { /* it isn't a directive */ parse_line(pass1, line, &output_ins, report_error, evaluate, def_label); if (!(optimizing > 0) && pass == 2) { if (forwref != NULL && globallineno == forwref->lineno) { output_ins.forw_ref = true; do { output_ins.oprs[forwref->operand].opflags |= OPFLAG_FORWARD; forwref = saa_rstruct(forwrefs); } while (forwref != NULL && forwref->lineno == globallineno); } else output_ins.forw_ref = false; } if (!(optimizing > 0) && output_ins.forw_ref) { if (pass == 1) { for (i = 0; i < output_ins.operands; i++) { if (output_ins.oprs[i]. opflags & OPFLAG_FORWARD) { struct forwrefinfo *fwinf = (struct forwrefinfo *) saa_wstruct(forwrefs); fwinf->lineno = globallineno; fwinf->operand = i; } } } else { /* pass == 2 */ /* * Hack to prevent phase error in the code * rol ax,x * x equ 1 * * If the second operand is a forward reference, * the UNITY property of the number 1 in that * operand is cancelled. Otherwise the above * sequence will cause a phase error. * * This hack means that the above code will * generate 286+ code. * * The forward reference will mean that the * operand will not have the UNITY property on * the first pass, so the pass behaviours will * be consistent. */ if (output_ins.operands >= 2 && (output_ins.oprs[1].opflags & OPFLAG_FORWARD) && !(IMMEDIATE & ~output_ins.oprs[1].type)) { /* Remove special properties bits */ output_ins.oprs[1].type &= ~REG_SMASK; } } /* pass == 2 */ } /* forw_ref */ if (output_ins.opcode == I_EQU) { if (pass1 == 1) { /* * Special `..' EQUs get processed in pass two, * except `..@' macro-processor EQUs which are done * in the normal place. */ if (!output_ins.label) report_error(ERR_NONFATAL, "EQU not preceded by label"); else if (output_ins.label[0] != '.' || output_ins.label[1] != '.' || output_ins.label[2] == '@') { if (output_ins.operands == 1 && (output_ins.oprs[0].type & IMMEDIATE) && output_ins.oprs[0].wrt == NO_SEG) { int isext = output_ins.oprs[0]. opflags & OPFLAG_EXTERN; def_label(output_ins.label, output_ins.oprs[0].segment, output_ins.oprs[0].offset, NULL, false, isext, ofmt, report_error); } else if (output_ins.operands == 2 && (output_ins.oprs[0]. type & IMMEDIATE) && (output_ins.oprs[0].type & COLON) && output_ins.oprs[0].segment == NO_SEG && output_ins.oprs[0].wrt == NO_SEG && (output_ins.oprs[1]. type & IMMEDIATE) && output_ins.oprs[1].segment == NO_SEG && output_ins.oprs[1].wrt == NO_SEG) { def_label(output_ins.label, output_ins.oprs[0]. offset | SEG_ABS, output_ins.oprs[1].offset, NULL, false, false, ofmt, report_error); } else report_error(ERR_NONFATAL, "bad syntax for EQU"); } } else { /* pass == 2 */ /* * Special `..' EQUs get processed here, except * `..@' macro processor EQUs which are done above. */ if (output_ins.label[0] == '.' && output_ins.label[1] == '.' && output_ins.label[2] != '@') { if (output_ins.operands == 1 && (output_ins.oprs[0].type & IMMEDIATE)) { define_label(output_ins.label, output_ins.oprs[0].segment, output_ins.oprs[0].offset, NULL, false, false, ofmt, report_error); } else if (output_ins.operands == 2 && (output_ins.oprs[0]. type & IMMEDIATE) && (output_ins.oprs[0].type & COLON) && output_ins.oprs[0].segment == NO_SEG && (output_ins.oprs[1]. type & IMMEDIATE) && output_ins.oprs[1].segment == NO_SEG) { define_label(output_ins.label, output_ins.oprs[0]. offset | SEG_ABS, output_ins.oprs[1].offset, NULL, false, false, ofmt, report_error); } else report_error(ERR_NONFATAL, "bad syntax for EQU"); } } /* pass == 2 */ } else { /* instruction isn't an EQU */ if (pass1 == 1) { int64_t l = insn_size(location.segment, offs, sb, cpu, &output_ins, report_error); /* if (using_debug_info) && output_ins.opcode != -1) */ if (using_debug_info) { /* fbk 03/25/01 */ /* this is done here so we can do debug type info */ int32_t typeinfo = TYS_ELEMENTS(output_ins.operands); switch (output_ins.opcode) { case I_RESB: typeinfo = TYS_ELEMENTS(output_ins.oprs[0]. offset) | TY_BYTE; break; case I_RESW: typeinfo = TYS_ELEMENTS(output_ins.oprs[0]. offset) | TY_WORD; break; case I_RESD: typeinfo = TYS_ELEMENTS(output_ins.oprs[0]. offset) | TY_DWORD; break; case I_RESQ: typeinfo = TYS_ELEMENTS(output_ins.oprs[0]. offset) | TY_QWORD; break; case I_REST: typeinfo = TYS_ELEMENTS(output_ins.oprs[0]. offset) | TY_TBYTE; break; case I_DB: typeinfo |= TY_BYTE; break; case I_DW: typeinfo |= TY_WORD; break; case I_DD: if (output_ins.eops_float) typeinfo |= TY_FLOAT; else typeinfo |= TY_DWORD; break; case I_DQ: typeinfo |= TY_QWORD; break; case I_DT: typeinfo |= TY_TBYTE; break; case I_DO: typeinfo |= TY_OWORD; break; default: typeinfo = TY_LABEL; } ofmt->current_dfmt->debug_typevalue(typeinfo); } if (l != -1) { offs += l; SET_CURR_OFFS(offs); } /* * else l == -1 => invalid instruction, which will be * flagged as an error on pass 2 */ } else { /* pass == 2 */ offs += assemble(location.segment, offs, sb, cpu, &output_ins, ofmt, report_error, &nasmlist); SET_CURR_OFFS(offs); } } /* not an EQU */ cleanup_insn(&output_ins); } nasm_free(line); location.offset = offs = GET_CURR_OFFS; } /* end while (line = preproc->getline... */ if (pass1 == 2 && global_offset_changed) report_error(ERR_NONFATAL, "phase error detected at end of assembly."); if (pass1 == 1) preproc->cleanup(1); if (pass1 == 1 && terminate_after_phase) { fclose(ofile); remove(outname); if (want_usage) usage(); exit(1); } pass_cnt++; if (pass > 1 && !global_offset_changed) { pass0++; if (pass0 == 2) pass = pass_max - 1; } else if (!(optimizing > 0)) pass0++; } /* for (pass=1; pass<=2; pass++) */ preproc->cleanup(0); nasmlist.cleanup(); #if 1 if (optimizing > 0 && opt_verbose_info) /* -On and -Ov switches */ fprintf(stdout, "info:: assembly required 1+%d+1 passes\n", pass_cnt - 2); #endif } /* exit from assemble_file (...) */ static enum directives getkw(char **directive, char **value) { char *p, *q, *buf; buf = *directive; /* allow leading spaces or tabs */ while (*buf == ' ' || *buf == '\t') buf++; if (*buf != '[') return 0; p = buf; while (*p && *p != ']') p++; if (!*p) return 0; q = p++; while (*p && *p != ';') { if (!isspace(*p)) return 0; p++; } q[1] = '\0'; *directive = p = buf + 1; while (*buf && *buf != ' ' && *buf != ']' && *buf != '\t') buf++; if (*buf == ']') { *buf = '\0'; *value = buf; } else { *buf++ = '\0'; while (isspace(*buf)) buf++; /* beppu - skip leading whitespace */ *value = buf; while (*buf != ']') buf++; *buf++ = '\0'; } return bsii(*directive, directives, elements(directives)); } /** * gnu style error reporting * This function prints an error message to error_file in the * style used by GNU. An example would be: * file.asm:50: error: blah blah blah * where file.asm is the name of the file, 50 is the line number on * which the error occurs (or is detected) and "error:" is one of * the possible optional diagnostics -- it can be "error" or "warning" * or something else. Finally the line terminates with the actual * error message. * * @param severity the severity of the warning or error * @param fmt the printf style format string */ static void report_error_gnu(int severity, const char *fmt, ...) { va_list ap; if (is_suppressed_warning(severity)) return; if (severity & ERR_NOFILE) fputs("nasm: ", error_file); else { char *currentfile = NULL; int32_t lineno = 0; src_get(&lineno, ¤tfile); fprintf(error_file, "%s:%"PRId32": ", currentfile, lineno); nasm_free(currentfile); } va_start(ap, fmt); report_error_common(severity, fmt, ap); va_end(ap); } /** * MS style error reporting * This function prints an error message to error_file in the * style used by Visual C and some other Microsoft tools. An example * would be: * file.asm(50) : error: blah blah blah * where file.asm is the name of the file, 50 is the line number on * which the error occurs (or is detected) and "error:" is one of * the possible optional diagnostics -- it can be "error" or "warning" * or something else. Finally the line terminates with the actual * error message. * * @param severity the severity of the warning or error * @param fmt the printf style format string */ static void report_error_vc(int severity, const char *fmt, ...) { va_list ap; if (is_suppressed_warning(severity)) return; if (severity & ERR_NOFILE) fputs("nasm: ", error_file); else { char *currentfile = NULL; int32_t lineno = 0; src_get(&lineno, ¤tfile); fprintf(error_file, "%s(%"PRId32") : ", currentfile, lineno); nasm_free(currentfile); } va_start(ap, fmt); report_error_common(severity, fmt, ap); va_end(ap); } /** * check for supressed warning * checks for suppressed warning or pass one only warning and we're * not in pass 1 * * @param severity the severity of the warning or error * @return true if we should abort error/warning printing */ static int is_suppressed_warning(int severity) { /* * See if it's a suppressed warning. */ return ((severity & ERR_MASK) == ERR_WARNING && (severity & ERR_WARN_MASK) != 0 && suppressed[(severity & ERR_WARN_MASK) >> ERR_WARN_SHR]) || /* * See if it's a pass-one only warning and we're not in pass one. */ ((severity & ERR_PASS1) && pass0 == 2); } /** * common error reporting * This is the common back end of the error reporting schemes currently * implemented. It prints the nature of the warning and then the * specific error message to error_file and may or may not return. It * doesn't return if the error severity is a "panic" or "debug" type. * * @param severity the severity of the warning or error * @param fmt the printf style format string */ static void report_error_common(int severity, const char *fmt, va_list args) { switch (severity & ERR_MASK) { case ERR_WARNING: fputs("warning: ", error_file); break; case ERR_NONFATAL: fputs("error: ", error_file); break; case ERR_FATAL: fputs("fatal: ", error_file); break; case ERR_PANIC: fputs("panic: ", error_file); break; case ERR_DEBUG: fputs("debug: ", error_file); break; } vfprintf(error_file, fmt, args); putc('\n', error_file); if (severity & ERR_USAGE) want_usage = true; switch (severity & ERR_MASK) { case ERR_DEBUG: /* no further action, by definition */ break; case ERR_WARNING: if (!suppressed[0]) /* Treat warnings as errors */ terminate_after_phase = true; break; case ERR_NONFATAL: terminate_after_phase = true; break; case ERR_FATAL: if (ofile) { fclose(ofile); remove(outname); } if (want_usage) usage(); exit(1); /* instantly die */ break; /* placate silly compilers */ case ERR_PANIC: fflush(NULL); /* abort(); *//* halt, catch fire, and dump core */ exit(3); break; } } static void usage(void) { fputs("type `nasm -h' for help\n", error_file); } static void register_output_formats(void) { ofmt = ofmt_register(report_error); } #define BUF_DELTA 512 static FILE *no_pp_fp; static efunc no_pp_err; static ListGen *no_pp_list; static int32_t no_pp_lineinc; static void no_pp_reset(char *file, int pass, efunc error, evalfunc eval, ListGen * listgen) { src_set_fname(nasm_strdup(file)); src_set_linnum(0); no_pp_lineinc = 1; no_pp_err = error; no_pp_fp = fopen(file, "r"); if (!no_pp_fp) no_pp_err(ERR_FATAL | ERR_NOFILE, "unable to open input file `%s'", file); no_pp_list = listgen; (void)pass; /* placate compilers */ (void)eval; /* placate compilers */ } static char *no_pp_getline(void) { char *buffer, *p, *q; int bufsize; bufsize = BUF_DELTA; buffer = nasm_malloc(BUF_DELTA); src_set_linnum(src_get_linnum() + no_pp_lineinc); while (1) { /* Loop to handle %line */ p = buffer; while (1) { /* Loop to handle long lines */ q = fgets(p, bufsize - (p - buffer), no_pp_fp); if (!q) break; p += strlen(p); if (p > buffer && p[-1] == '\n') break; if (p - buffer > bufsize - 10) { int offset; offset = p - buffer; bufsize += BUF_DELTA; buffer = nasm_realloc(buffer, bufsize); p = buffer + offset; } } if (!q && p == buffer) { nasm_free(buffer); return NULL; } /* * Play safe: remove CRs, LFs and any spurious ^Zs, if any of * them are present at the end of the line. */ buffer[strcspn(buffer, "\r\n\032")] = '\0'; if (!nasm_strnicmp(buffer, "%line", 5)) { int32_t ln; int li; char *nm = nasm_malloc(strlen(buffer)); if (sscanf(buffer + 5, "%"PRId32"+%d %s", &ln, &li, nm) == 3) { nasm_free(src_set_fname(nm)); src_set_linnum(ln); no_pp_lineinc = li; continue; } nasm_free(nm); } break; } no_pp_list->line(LIST_READ, buffer); return buffer; } static void no_pp_cleanup(int pass) { (void)pass; /* placate GCC */ fclose(no_pp_fp); } static uint32_t get_cpu(char *value) { if (!strcmp(value, "8086")) return IF_8086; if (!strcmp(value, "186")) return IF_186; if (!strcmp(value, "286")) return IF_286; if (!strcmp(value, "386")) return IF_386; if (!strcmp(value, "486")) return IF_486; if (!strcmp(value, "586") || !nasm_stricmp(value, "pentium")) return IF_PENT; if (!strcmp(value, "686") || !nasm_stricmp(value, "ppro") || !nasm_stricmp(value, "pentiumpro") || !nasm_stricmp(value, "p2")) return IF_P6; if (!nasm_stricmp(value, "p3") || !nasm_stricmp(value, "katmai")) return IF_KATMAI; if (!nasm_stricmp(value, "p4") || /* is this right? -- jrc */ !nasm_stricmp(value, "willamette")) return IF_WILLAMETTE; if (!nasm_stricmp(value, "prescott")) return IF_PRESCOTT; if (!nasm_stricmp(value, "x64") || !nasm_stricmp(value, "x86-64")) return IF_X86_64; if (!nasm_stricmp(value, "ia64") || !nasm_stricmp(value, "ia-64") || !nasm_stricmp(value, "itanium") || !nasm_stricmp(value, "itanic") || !nasm_stricmp(value, "merced")) return IF_IA64; report_error(pass0 < 2 ? ERR_NONFATAL : ERR_FATAL, "unknown 'cpu' type"); return IF_PLEVEL; /* the maximum level */ } static int get_bits(char *value) { int i; if ((i = atoi(value)) == 16) return i; /* set for a 16-bit segment */ else if (i == 32) { if (cpu < IF_386) { report_error(ERR_NONFATAL, "cannot specify 32-bit segment on processor below a 386"); i = 16; } } else if (i == 64) { if (cpu < IF_X86_64) { report_error(ERR_NONFATAL, "cannot specify 64-bit segment on processor below an x86-64"); i = 16; } if (i != maxbits) { report_error(ERR_NONFATAL, "%s output format does not support 64-bit code", ofmt->shortname); i = 16; } } else { report_error(pass0 < 2 ? ERR_NONFATAL : ERR_FATAL, "`%s' is not a valid segment size; must be 16, 32 or 64", value); i = 16; } return i; } /* end of nasm.c */