Mercurial > hg-old > index.cgi
annotate src/parse.c @ 185:b89adfb0d174
Added support for outputting a linkmap
author | lost |
---|---|
date | Sat, 21 Mar 2009 19:47:45 +0000 |
parents | f59c0916753d |
children |
rev | line source |
---|---|
36 | 1 /* |
2 parse.c | |
3 Copyright © 2008 William Astle | |
4 | |
5 This file is part of LWASM. | |
6 | |
7 LWASM is free software: you can redistribute it and/or modify it under the | |
8 terms of the GNU General Public License as published by the Free Software | |
9 Foundation, either version 3 of the License, or (at your option) any later | |
10 version. | |
11 | |
12 This program is distributed in the hope that it will be useful, but WITHOUT | |
13 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | |
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | |
15 more details. | |
16 | |
17 You should have received a copy of the GNU General Public License along with | |
18 this program. If not, see <http://www.gnu.org/licenses/>. | |
19 */ | |
20 | |
21 /* | |
22 Contains the general parser | |
23 */ | |
24 | |
25 #define __parse_c_seen__ | |
26 | |
27 #include <ctype.h> | |
28 #include <string.h> | |
29 | |
30 #include "lwasm.h" | |
31 #include "instab.h" | |
32 #include "util.h" | |
33 | |
34 // parse a line and despatch to the appropriate handlers for opcodes | |
35 int lwasm_parse_line(asmstate_t *as, lwasm_line_t *l) | |
36 { | |
37 char *p, *p2; | |
38 char *opc; | |
39 int opnum; | |
44 | 40 char *sym = NULL; |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
41 |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
42 // if this was a bad op first pass (or otherwise a no-process line) |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
43 // ignore it |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
44 if (l -> badop) |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
45 return; |
36 | 46 |
47 p = l -> text; | |
101
f59c0916753d
Fixed relative branches and PCR addressing to handle constant intra-section references properly
lost
parents:
99
diff
changeset
|
48 l -> sect = as -> csect; |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
49 |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
50 // blank lines are a no brainer |
36 | 51 if (!*p) |
37
538e15927776
Added symbol handling to expression subsystem; adpated instruction handlers to the new scheme; misc fixes
lost
parents:
36
diff
changeset
|
52 { |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
53 as -> context = lwasm_next_context(as); |
36 | 54 return 0; |
37
538e15927776
Added symbol handling to expression subsystem; adpated instruction handlers to the new scheme; misc fixes
lost
parents:
36
diff
changeset
|
55 } |
36 | 56 |
52 | 57 // for output generation later but only on pass 1 |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
58 // also used by some pseudo ops on pass 2 |
52 | 59 if (as -> passnum == 1) |
60 l -> codeaddr = as -> addr; | |
44 | 61 |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
62 // if it's a comment, return (this doesn't cause a context change) |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
63 if (*p == '*' || *p == ';') |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
64 return; |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
65 |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
66 // if we start with a non-space character, it's a symbol |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
67 if (!isspace(*p)) |
36 | 68 { |
69 // we have a symbol specified here | |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
70 // parse it out and record it for later use |
37
538e15927776
Added symbol handling to expression subsystem; adpated instruction handlers to the new scheme; misc fixes
lost
parents:
36
diff
changeset
|
71 for (p2 = p; *p2 && !isspace(*p2); p2++) |
538e15927776
Added symbol handling to expression subsystem; adpated instruction handlers to the new scheme; misc fixes
lost
parents:
36
diff
changeset
|
72 /* do nothing */ ; |
538e15927776
Added symbol handling to expression subsystem; adpated instruction handlers to the new scheme; misc fixes
lost
parents:
36
diff
changeset
|
73 |
538e15927776
Added symbol handling to expression subsystem; adpated instruction handlers to the new scheme; misc fixes
lost
parents:
36
diff
changeset
|
74 sym = lwasm_alloc((p2 - p) + 1); |
538e15927776
Added symbol handling to expression subsystem; adpated instruction handlers to the new scheme; misc fixes
lost
parents:
36
diff
changeset
|
75 sym[p2 - p] = '\0'; |
538e15927776
Added symbol handling to expression subsystem; adpated instruction handlers to the new scheme; misc fixes
lost
parents:
36
diff
changeset
|
76 memcpy(sym, p, p2 - p); |
538e15927776
Added symbol handling to expression subsystem; adpated instruction handlers to the new scheme; misc fixes
lost
parents:
36
diff
changeset
|
77 |
44 | 78 p = p2; |
37
538e15927776
Added symbol handling to expression subsystem; adpated instruction handlers to the new scheme; misc fixes
lost
parents:
36
diff
changeset
|
79 } |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
80 l -> sym = sym; |
36 | 81 |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
82 // now skip any whitespace to find the opcode |
36 | 83 while (*p && isspace(*p)) |
84 p++; | |
85 | |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
86 // is the line blank? |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
87 if (!*p && !sym) |
37
538e15927776
Added symbol handling to expression subsystem; adpated instruction handlers to the new scheme; misc fixes
lost
parents:
36
diff
changeset
|
88 { |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
89 // nothing but white space *is* a context break |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
90 as -> context = lwasm_next_context(as); |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
91 return; |
37
538e15927776
Added symbol handling to expression subsystem; adpated instruction handlers to the new scheme; misc fixes
lost
parents:
36
diff
changeset
|
92 } |
36 | 93 |
94 // parse the opcode | |
95 for (p2 = p; *p2 && !isspace(*p2); p2++) | |
96 /* do nothing */ ; | |
97 | |
98 opc = lwasm_alloc((p2 - p) + 1); | |
99 memcpy(opc, p, p2 - p); | |
100 opc[p2 - p] = '\0'; | |
101 | |
38 | 102 debug_message(2, "Found operation code: '%s'", opc); |
103 | |
36 | 104 // skip intervening whitespace if present |
105 while (*p2 && isspace(*p2)) | |
106 p2++; | |
107 | |
108 // look up instruction in insn table | |
109 for (opnum = 0; instab[opnum].opcode; opnum++) | |
110 { | |
111 if (!strcasecmp(instab[opnum].opcode, opc)) | |
112 break; | |
113 } | |
114 | |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
115 // if we found no operation, check if we had a comment |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
116 // the reason this check is here is to allow for "private" |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
117 // operation codes like "*pragma" which will be ignored by |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
118 // other assemblers |
68 | 119 // also skip empty ops |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
120 if (!(instab[opnum].opcode)) |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
121 { |
68 | 122 if (*opc == '*' || *opc == ';' || !*opc) |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
123 goto done_line; |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
124 } |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
125 |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
126 // now we have the opcode and the symbol, we can decide if we're |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
127 // actually going to do anything with this line |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
128 |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
129 // we will NOT call the function if any of the following are true: |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
130 |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
131 // - we are skipping a condition and the operation code is not a conditional |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
132 // - we are defining a macro and the operation code is not ENDM |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
133 |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
134 // we will call the function in any other circumstance |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
135 |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
136 // first condition above |
57 | 137 if (as -> inmacro && instab[opnum].endm == 0) |
138 { | |
139 add_macro_line(as, l -> text); | |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
140 goto done_line; |
57 | 141 } |
142 | |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
143 // second condition above |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
144 if (as -> skipcond && instab[opnum].iscond == 0) |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
145 goto done_line; |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
146 |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
147 // we've registered the symbol as needed |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
148 // now we need to check for a macro call IFF we don't collide with |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
149 // an operation code; otherwise, call the operation function |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
150 if (instab[opnum].opcode) |
36 | 151 { |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
152 if (instab[opnum].fn) |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
153 { |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
154 (instab[opnum].fn)(as, l, &p2, opnum); |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
155 } |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
156 else |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
157 { |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
158 // carp about unimplemented operation |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
159 register_error(as, l, 1, "Unimplemented operation code: %s", opc); |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
160 } |
36 | 161 } |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
162 else |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
163 { |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
164 if (expand_macro(as, l, &p2, opc) == 0) |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
165 goto done_line; |
36 | 166 |
66
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
167 // carp about an unknown operation code and note that fact for |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
168 // pass 2 in case a macro appears later with the same name! |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
169 register_error(as, l, 1, "Uknown operation code: %s", opc); |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
170 l -> badop = 1; |
aa9d9fedfdf4
Redid lwasm_parse_line() to correct overly complex logic flaws
lost
parents:
64
diff
changeset
|
171 } |
57 | 172 |
173 done_line: | |
68 | 174 if (!(as -> skipcond || as -> inmacro)) |
175 { | |
176 // register symbol if the operation didn't | |
177 if (sym && instab[opnum].setsym == 0) | |
178 { | |
179 if (as -> passnum == 1) | |
180 { | |
71
90a5657d5408
Fixed problem with symbols being registered with the address of the NEXT instruction
lost
parents:
68
diff
changeset
|
181 debug_message(1, "Registering symbol '%s' at %04X", sym, l -> codeaddr); |
90a5657d5408
Fixed problem with symbols being registered with the address of the NEXT instruction
lost
parents:
68
diff
changeset
|
182 if (lwasm_register_symbol(as, l, sym, l -> codeaddr, SYMBOL_NORM) < 0) |
68 | 183 l -> sym = NULL; |
184 else | |
185 l -> addrset = 1; | |
186 } | |
187 } | |
188 } | |
99 | 189 |
85 | 190 l -> sect = as -> csect; |
91
718998b673ee
Added incomplete references to object output and added support for section base terms in expression handler
lost
parents:
85
diff
changeset
|
191 l -> context = as -> context; |
85 | 192 |
36 | 193 lwasm_free(opc); |
44 | 194 if (sym) |
195 lwasm_free(sym); | |
36 | 196 } |