Mercurial > hg-old > index.cgi
view lwasm/parse.c @ 269:6cbc409ff09f 2.6
Added asprintf redux
author | lost |
---|---|
date | Tue, 22 Dec 2009 05:53:05 +0000 |
parents | 6363b9ebf825 |
children | 6d09310438a4 |
line wrap: on
line source
/* parse.c Copyright © 2008 William Astle This file is part of LWASM. LWASM is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program. If not, see <http://www.gnu.org/licenses/>. */ /* Contains the general parser */ #define __parse_c_seen__ #include <config.h> #include <ctype.h> #include <string.h> #include "lwasm.h" #include "instab.h" #include "util.h" // parse a line and despatch to the appropriate handlers for opcodes int lwasm_parse_line(asmstate_t *as, lwasm_line_t *l) { char *p, *p2; char *opc; int opnum; char *sym = NULL; // if this was a bad op first pass (or otherwise a no-process line) // ignore it if (l -> badop) return; p = l -> text; l -> sect = as -> csect; l -> inmod = as -> inmod; // blank lines are a no brainer if (!*p) { as -> context = lwasm_next_context(as); return 0; } // for output generation later but only on pass 1 // also used by some pseudo ops on pass 2 if (as -> passnum == 1) l -> codeaddr = as -> addr; // check if there is a line number and ignore it if there is if (isdigit(*p)) { for (p2 = p; *p2 && isdigit(*p2); p2++) /* do nothing */ ; // we have a line number, skip it and the *first* // whitespace character if (!*p2 || isspace(*p2)) p = p2 + 1; } // if it's a comment, return (this doesn't cause a context change) if (*p == '*' || *p == ';') return; // if we have C pre-processor directives/output, ignore it if (*p == '#') return; // if we start with a non-space character, it's a symbol symbolagain: if (!isspace(*p)) { // if it starts with a comment character, it's not a symbol if (*p == ';' || *p == '*') return; // we have a symbol specified here // parse it out and record it for later use for (p2 = p; *p2 && !isspace(*p2) && *p2 != ':'; p2++) /* do nothing */ ; sym = lwasm_alloc((p2 - p) + 1); sym[p2 - p] = '\0'; memcpy(sym, p, p2 - p); p = p2; if (!*sym) { register_error(as, l, 1, "Invalid symbol"); lwasm_free(sym); sym = NULL; } if (*p == ':') p++; } l -> sym = sym; // now skip any whitespace to find the opcode while (*p && isspace(*p)) p++; // is the line blank? if (!*p && !sym) { // nothing but white space *is* a context break as -> context = lwasm_next_context(as); return; } // parse the opcode for (p2 = p; *p2 && !isspace(*p2); p2++) /* do nothing */ ; opc = lwasm_alloc((p2 - p) + 1); memcpy(opc, p, p2 - p); opc[p2 - p] = '\0'; if (strchr(opc, ':')) { lwasm_free(opc); goto symbolagain; } l -> forceglobal = 0; // if the opcode contains an =, treat it as "symbol = expr" if (!sym && strchr(opc, '=')) { for (p2 = opc; *p2 && *p2 != '='; p2++) /* do nothing */ ; sym = lwasm_alloc((p2 - opc) + 1); memcpy(sym, opc, p2 - opc); sym[p2 - opc] = '\0'; l -> sym = sym; p2 = p + (p2 - opc) + 1; // p2++; opc[0] = '='; opc[1] = '\0'; debug_message(2, "Found opcode = with symbol %s and operand %s", sym, p2); l -> forceglobal = 1; } debug_message(2, "Found operation code: '%s'", opc); // skip intervening whitespace if present while (*p2 && isspace(*p2)) p2++; // look up instruction in insn table for (opnum = 0; instab[opnum].opcode; opnum++) { if (!strcasecmp(instab[opnum].opcode, opc)) break; } // if we found no operation, check if we had a comment // the reason this check is here is to allow for "private" // operation codes like "*pragma" which will be ignored by // other assemblers // also skip empty ops if (!(instab[opnum].opcode)) { if (*opc == '*' || *opc == ';' || !*opc) goto done_line; } // now we have the opcode and the symbol, we can decide if we're // actually going to do anything with this line // we will NOT call the function if any of the following are true: // - we are skipping a condition and the operation code is not a conditional // - we are defining a macro and the operation code is not ENDM // we will call the function in any other circumstance // first condition above if (as -> inmacro && instab[opnum].endm == 0) { add_macro_line(as, l -> text); goto done_line; } // second condition above if (as -> skipcond && instab[opnum].iscond == 0) goto done_line; if (as -> instruct && as -> passnum == 1) { structtab_t *s = NULL; struct struct_sym_e *e, *e2; // look for a structure if not an acceptable opcode if (!instab[opnum].opcode) { for (s = as -> structs; s; s = s -> next) { if (s == as -> cstruct) continue; if (!strcmp(opc, s -> name)) goto isok; } } // check for a "reservation opcode" if (instab[opnum].opcode && instab[opnum].isreserve) { (instab[opnum].fn)(as, l, &p2, opnum); // if we didn't end on a "space" character or EOL, throw error if (p2 && *p2 && !isspace(*p2) && !(l -> err) && as -> passnum == 1) register_error(as, l, 1, "Bad operand: %s (%d)", p2, as -> passnum); if (as -> instruct == 0) goto done_line; goto isok; } // carp if not valid register_error(as, l, 1, "Only other structs and rmb allowed in struct"); l -> badop = 1; goto done_line; isok: for (e2 = as -> cstruct -> fields; e2 && e2 -> next; e2 = e2 -> next) /* do nothing */ ; e = lwasm_alloc(sizeof(struct struct_sym_e)); e -> next = NULL; e -> substruct = s; if (sym) e -> name = lwasm_strdup(sym); else e -> name = NULL; if (s) e -> size = s -> size; else e -> size = l -> nocodelen; if (e2) e2 -> next = e; else as -> cstruct -> fields = e; as -> cstruct -> size += e -> size; } // we've registered the symbol as needed // now we need to check for a macro call IFF we don't collide with // an operation code; otherwise, call the operation function if (instab[opnum].opcode) { if (instab[opnum].fn && !(as -> no6309 && instab[opnum].is6309)) { (instab[opnum].fn)(as, l, &p2, opnum); // if we didn't end on a "space" character or EOL, throw error if (p2 && *p2 && !isspace(*p2) && !(l -> err) && as -> passnum == 1) register_error(as, l, 1, "Bad operand: %s (%d)", p2, as -> passnum); } else { // carp about unimplemented operation if (instab[opnum].is6309) register_error(as, l, 1, "Use of 6309 operation code: %s", opc); else register_error(as, l, 1, "Unimplemented operation code: %s", opc); } } else { if (expand_macro(as, l, &p2, opc) == 0) goto done_line; if (expand_struct(as, l, &p2, opc) == 0) goto done_line; // carp about an unknown operation code and note that fact for // pass 2 in case a macro appears later with the same name! register_error(as, l, 1, "Uknown operation code: %s", opc); l -> badop = 1; } done_line: if (!(as -> skipcond || as -> inmacro)) { // register symbol if the operation didn't if (sym && instab[opnum].setsym == 0 && as -> instruct == 0) { if (as -> passnum == 1) { debug_message(1, "Registering symbol '%s' at %04X", sym, l -> codeaddr); if (lwasm_register_symbol(as, l, sym, l -> codeaddr, SYMBOL_NORM) < 0) l -> sym = NULL; else l -> addrset = 1; } } } l -> sect = as -> csect; l -> context = as -> context; lwasm_free(opc); if (sym) lwasm_free(sym); }