1 | /* parse_ack.c - parse GNU assembly Author: R.S. Veldema
|
---|
2 | * <rveldema@cs.vu.nl>
|
---|
3 | * 26 Aug 1996
|
---|
4 | */
|
---|
5 | #define nil 0
|
---|
6 | #include <stdio.h>
|
---|
7 | #include <stdlib.h>
|
---|
8 | #include <string.h>
|
---|
9 | #include <limits.h>
|
---|
10 | #include <assert.h>
|
---|
11 | #include "asmconv.h"
|
---|
12 | #include "token.h"
|
---|
13 | #include "asm86.h"
|
---|
14 | #include "languages.h"
|
---|
15 |
|
---|
16 | typedef struct mnemonic { /* GNU as86 mnemonics translation table. */
|
---|
17 | char *name;
|
---|
18 | opcode_t opcode;
|
---|
19 | optype_t optype;
|
---|
20 | } mnemonic_t;
|
---|
21 |
|
---|
22 | static mnemonic_t mnemtab[] = { /* This array is sorted. */
|
---|
23 | { ".align", DOT_ALIGN, PSEUDO },
|
---|
24 | { ".ascii", DOT_ASCII, PSEUDO },
|
---|
25 | { ".asciz", DOT_ASCIZ, PSEUDO },
|
---|
26 | { ".assert", DOT_ASSERT, PSEUDO },
|
---|
27 | { ".base", DOT_BASE, PSEUDO },
|
---|
28 | { ".bss", DOT_BSS, PSEUDO },
|
---|
29 | { ".byte", DOT_DATA1, PSEUDO },
|
---|
30 | { ".comm", DOT_COMM, PSEUDO },
|
---|
31 | { ".data", DOT_DATA, PSEUDO },
|
---|
32 | { ".data1", DOT_DATA1, PSEUDO },
|
---|
33 | { ".data2", DOT_DATA2, PSEUDO },
|
---|
34 | { ".data4", DOT_DATA4, PSEUDO },
|
---|
35 | { ".end", DOT_END, PSEUDO },
|
---|
36 | { ".extern", DOT_EXTERN, PSEUDO },
|
---|
37 | { ".file", DOT_FILE, PSEUDO },
|
---|
38 | { ".globl", DOT_DEFINE, PSEUDO },
|
---|
39 | { ".lcomm", DOT_LCOMM, PSEUDO },
|
---|
40 | { ".line", DOT_LINE, PSEUDO },
|
---|
41 | { ".list", DOT_LIST, PSEUDO },
|
---|
42 | { ".long", DOT_DATA4, PSEUDO },
|
---|
43 | { ".nolist", DOT_NOLIST, PSEUDO },
|
---|
44 | { ".rom", DOT_ROM, PSEUDO },
|
---|
45 | { ".space", DOT_SPACE, PSEUDO },
|
---|
46 | { ".symb", DOT_SYMB, PSEUDO },
|
---|
47 | { ".text", DOT_TEXT, PSEUDO },
|
---|
48 | { ".word", DOT_DATA2, PSEUDO },
|
---|
49 | { "aaa", AAA, WORD },
|
---|
50 | { "aad", AAD, WORD },
|
---|
51 | { "aam", AAM, WORD },
|
---|
52 | { "aas", AAS, WORD },
|
---|
53 | { "adcb", ADC, BYTE },
|
---|
54 | { "adcl", ADC, WORD },
|
---|
55 | { "adcw", ADC, OWORD },
|
---|
56 | { "addb", ADD, BYTE },
|
---|
57 | { "addl", ADD, WORD },
|
---|
58 | { "addw", ADD, OWORD },
|
---|
59 | { "andb", AND, BYTE },
|
---|
60 | { "andl", AND, WORD },
|
---|
61 | { "andw", AND, OWORD },
|
---|
62 | { "arpl", ARPL, WORD },
|
---|
63 | { "bound", BOUND, WORD },
|
---|
64 | { "bsf", BSF, WORD },
|
---|
65 | { "bsr", BSR, WORD },
|
---|
66 | { "bswap", BSWAP, WORD },
|
---|
67 | { "btc", BTC, WORD },
|
---|
68 | { "btl", BT, WORD },
|
---|
69 | { "btr", BTR, WORD },
|
---|
70 | { "bts", BTS, WORD },
|
---|
71 | { "btw", BT, OWORD },
|
---|
72 | { "call", CALL, JUMP },
|
---|
73 | { "callf", CALLF, JUMP },
|
---|
74 | { "cbtw", CBW, OWORD },
|
---|
75 | { "cbw", CBW, WORD },
|
---|
76 | { "cdq", CWD, WORD },
|
---|
77 | { "clc", CLC, WORD },
|
---|
78 | { "cld", CLD, WORD },
|
---|
79 | { "cli", CLI, WORD },
|
---|
80 | { "cltd", CWD, WORD },
|
---|
81 | { "clts", CLTS, WORD },
|
---|
82 | { "cmc", CMC, WORD },
|
---|
83 | { "cmpb", CMP, BYTE },
|
---|
84 | { "cmpl", CMP, WORD },
|
---|
85 | { "cmps", CMPS, WORD },
|
---|
86 | { "cmpsb", CMPS, BYTE },
|
---|
87 | { "cmpw", CMP, OWORD },
|
---|
88 | { "cmpxchg", CMPXCHG, WORD },
|
---|
89 | { "cwd", CWD, WORD },
|
---|
90 | { "cwde", CBW, WORD },
|
---|
91 | { "cwtd", CWD, OWORD },
|
---|
92 | { "cwtl", CBW, WORD },
|
---|
93 | { "daa", DAA, WORD },
|
---|
94 | { "das", DAS, WORD },
|
---|
95 | { "decb", DEC, BYTE },
|
---|
96 | { "decl", DEC, WORD },
|
---|
97 | { "decw", DEC, OWORD },
|
---|
98 | { "divb", DIV, BYTE },
|
---|
99 | { "divl", DIV, WORD },
|
---|
100 | { "divw", DIV, OWORD },
|
---|
101 | { "enter", ENTER, WORD },
|
---|
102 | { "f2xm1", F2XM1, WORD },
|
---|
103 | { "fabs", FABS, WORD },
|
---|
104 | { "fadd", FADD, WORD },
|
---|
105 | { "faddd", FADDD, WORD },
|
---|
106 | { "faddp", FADDP, WORD },
|
---|
107 | { "fadds", FADDS, WORD },
|
---|
108 | { "fbld", FBLD, WORD },
|
---|
109 | { "fbstp", FBSTP, WORD },
|
---|
110 | { "fchs", FCHS, WORD },
|
---|
111 | { "fcomd", FCOMD, WORD },
|
---|
112 | { "fcompd", FCOMPD, WORD },
|
---|
113 | { "fcompp", FCOMPP, WORD },
|
---|
114 | { "fcomps", FCOMPS, WORD },
|
---|
115 | { "fcoms", FCOMS, WORD },
|
---|
116 | { "fcos", FCOS, WORD },
|
---|
117 | { "fdecstp", FDECSTP, WORD },
|
---|
118 | { "fdivd", FDIVD, WORD },
|
---|
119 | { "fdivp", FDIVP, WORD },
|
---|
120 | { "fdivrd", FDIVRD, WORD },
|
---|
121 | { "fdivrp", FDIVRP, WORD },
|
---|
122 | { "fdivrs", FDIVRS, WORD },
|
---|
123 | { "fdivs", FDIVS, WORD },
|
---|
124 | { "ffree", FFREE, WORD },
|
---|
125 | { "fiaddl", FIADDL, WORD },
|
---|
126 | { "fiadds", FIADDS, WORD },
|
---|
127 | { "ficom", FICOM, WORD },
|
---|
128 | { "ficomp", FICOMP, WORD },
|
---|
129 | { "fidivl", FIDIVL, WORD },
|
---|
130 | { "fidivrl", FIDIVRL, WORD },
|
---|
131 | { "fidivrs", FIDIVRS, WORD },
|
---|
132 | { "fidivs", FIDIVS, WORD },
|
---|
133 | { "fildl", FILDL, WORD },
|
---|
134 | { "fildq", FILDQ, WORD },
|
---|
135 | { "filds", FILDS, WORD },
|
---|
136 | { "fimull", FIMULL, WORD },
|
---|
137 | { "fimuls", FIMULS, WORD },
|
---|
138 | { "fincstp", FINCSTP, WORD },
|
---|
139 | { "fistl", FISTL, WORD },
|
---|
140 | { "fistp", FISTP, WORD },
|
---|
141 | { "fists", FISTS, WORD },
|
---|
142 | { "fisubl", FISUBL, WORD },
|
---|
143 | { "fisubrl", FISUBRL, WORD },
|
---|
144 | { "fisubrs", FISUBRS, WORD },
|
---|
145 | { "fisubs", FISUBS, WORD },
|
---|
146 | { "fld1", FLD1, WORD },
|
---|
147 | { "fldcw", FLDCW, WORD },
|
---|
148 | { "fldd", FLDD, WORD },
|
---|
149 | { "fldenv", FLDENV, WORD },
|
---|
150 | { "fldl2e", FLDL2E, WORD },
|
---|
151 | { "fldl2t", FLDL2T, WORD },
|
---|
152 | { "fldlg2", FLDLG2, WORD },
|
---|
153 | { "fldln2", FLDLN2, WORD },
|
---|
154 | { "fldpi", FLDPI, WORD },
|
---|
155 | { "flds", FLDS, WORD },
|
---|
156 | { "fldx", FLDX, WORD },
|
---|
157 | { "fldz", FLDZ, WORD },
|
---|
158 | { "fmuld", FMULD, WORD },
|
---|
159 | { "fmulp", FMULP, WORD },
|
---|
160 | { "fmuls", FMULS, WORD },
|
---|
161 | { "fnclex", FCLEX, WORD },
|
---|
162 | { "fninit", FINIT, WORD },
|
---|
163 | { "fnop", FNOP, WORD },
|
---|
164 | { "fnsave", FSAVE, WORD },
|
---|
165 | { "fnstcw", FSTCW, WORD },
|
---|
166 | { "fnstenv", FSTENV, WORD },
|
---|
167 | { "fpatan", FPATAN, WORD },
|
---|
168 | { "fprem", FPREM, WORD },
|
---|
169 | { "fprem1", FPREM1, WORD },
|
---|
170 | { "fptan", FPTAN, WORD },
|
---|
171 | { "frndint", FRNDINT, WORD },
|
---|
172 | { "frstor", FRSTOR, WORD },
|
---|
173 | { "fscale", FSCALE, WORD },
|
---|
174 | { "fsin", FSIN, WORD },
|
---|
175 | { "fsincos", FSINCOS, WORD },
|
---|
176 | { "fsqrt", FSQRT, WORD },
|
---|
177 | { "fstd", FSTD, WORD },
|
---|
178 | { "fstpd", FSTPD, WORD },
|
---|
179 | { "fstps", FSTPS, WORD },
|
---|
180 | { "fstpx", FSTPX, WORD },
|
---|
181 | { "fsts", FSTS, WORD },
|
---|
182 | { "fstsw", FSTSW, WORD },
|
---|
183 | { "fsubd", FSUBD, WORD },
|
---|
184 | { "fsubp", FSUBP, WORD },
|
---|
185 | { "fsubpr", FSUBPR, WORD },
|
---|
186 | { "fsubrd", FSUBRD, WORD },
|
---|
187 | { "fsubrs", FSUBRS, WORD },
|
---|
188 | { "fsubs", FSUBS, WORD },
|
---|
189 | { "ftst", FTST, WORD },
|
---|
190 | { "fucom", FUCOM, WORD },
|
---|
191 | { "fucomp", FUCOMP, WORD },
|
---|
192 | { "fucompp", FUCOMPP, WORD },
|
---|
193 | { "fxam", FXAM, WORD },
|
---|
194 | { "fxch", FXCH, WORD },
|
---|
195 | { "fxtract", FXTRACT, WORD },
|
---|
196 | { "fyl2x", FYL2X, WORD },
|
---|
197 | { "fyl2xp1", FYL2XP1, WORD },
|
---|
198 | { "hlt", HLT, WORD },
|
---|
199 | { "idivb", IDIV, BYTE },
|
---|
200 | { "idivl", IDIV, WORD },
|
---|
201 | { "idivw", IDIV, OWORD },
|
---|
202 | { "imulb", IMUL, BYTE },
|
---|
203 | { "imull", IMUL, WORD },
|
---|
204 | { "imulw", IMUL, OWORD },
|
---|
205 | { "inb", IN, BYTE },
|
---|
206 | { "incb", INC, BYTE },
|
---|
207 | { "incl", INC, WORD },
|
---|
208 | { "incw", INC, OWORD },
|
---|
209 | { "inl", IN, WORD },
|
---|
210 | { "insb", INS, BYTE },
|
---|
211 | { "insl", INS, WORD },
|
---|
212 | { "insw", INS, OWORD },
|
---|
213 | { "int", INT, WORD },
|
---|
214 | { "into", INTO, JUMP },
|
---|
215 | { "invd", INVD, WORD },
|
---|
216 | { "invlpg", INVLPG, WORD },
|
---|
217 | { "inw", IN, OWORD },
|
---|
218 | { "iret", IRET, JUMP },
|
---|
219 | { "iretd", IRETD, JUMP },
|
---|
220 | { "ja", JA, JUMP },
|
---|
221 | { "jae", JAE, JUMP },
|
---|
222 | { "jb", JB, JUMP },
|
---|
223 | { "jbe", JBE, JUMP },
|
---|
224 | { "jc", JB, JUMP },
|
---|
225 | { "jcxz", JCXZ, JUMP },
|
---|
226 | { "je", JE, JUMP },
|
---|
227 | { "jecxz", JCXZ, JUMP },
|
---|
228 | { "jg", JG, JUMP },
|
---|
229 | { "jge", JGE, JUMP },
|
---|
230 | { "jl", JL, JUMP },
|
---|
231 | { "jle", JLE, JUMP },
|
---|
232 | { "jmp", JMP, JUMP },
|
---|
233 | { "jmpf", JMPF, JUMP },
|
---|
234 | { "jna", JBE, JUMP },
|
---|
235 | { "jnae", JB, JUMP },
|
---|
236 | { "jnb", JAE, JUMP },
|
---|
237 | { "jnbe", JA, JUMP },
|
---|
238 | { "jnc", JAE, JUMP },
|
---|
239 | { "jne", JNE, JUMP },
|
---|
240 | { "jng", JLE, JUMP },
|
---|
241 | { "jnge", JL, JUMP },
|
---|
242 | { "jnl", JGE, JUMP },
|
---|
243 | { "jnle", JG, JUMP },
|
---|
244 | { "jno", JNO, JUMP },
|
---|
245 | { "jnp", JNP, JUMP },
|
---|
246 | { "jns", JNS, JUMP },
|
---|
247 | { "jnz", JNE, JUMP },
|
---|
248 | { "jo", JO, JUMP },
|
---|
249 | { "jp", JP, JUMP },
|
---|
250 | { "js", JS, JUMP },
|
---|
251 | { "jz", JE, JUMP },
|
---|
252 | { "lahf", LAHF, WORD },
|
---|
253 | { "lar", LAR, WORD },
|
---|
254 | { "lds", LDS, WORD },
|
---|
255 | { "leal", LEA, WORD },
|
---|
256 | { "leave", LEAVE, WORD },
|
---|
257 | { "leaw", LEA, OWORD },
|
---|
258 | { "les", LES, WORD },
|
---|
259 | { "lfs", LFS, WORD },
|
---|
260 | { "lgdt", LGDT, WORD },
|
---|
261 | { "lgs", LGS, WORD },
|
---|
262 | { "lidt", LIDT, WORD },
|
---|
263 | { "lldt", LLDT, WORD },
|
---|
264 | { "lmsw", LMSW, WORD },
|
---|
265 | { "lock", LOCK, WORD },
|
---|
266 | { "lods", LODS, WORD },
|
---|
267 | { "lodsb", LODS, BYTE },
|
---|
268 | { "loop", LOOP, JUMP },
|
---|
269 | { "loope", LOOPE, JUMP },
|
---|
270 | { "loopne", LOOPNE, JUMP },
|
---|
271 | { "loopnz", LOOPNE, JUMP },
|
---|
272 | { "loopz", LOOPE, JUMP },
|
---|
273 | { "lsl", LSL, WORD },
|
---|
274 | { "lss", LSS, WORD },
|
---|
275 | { "ltr", LTR, WORD },
|
---|
276 | { "movb", MOV, BYTE },
|
---|
277 | { "movl", MOV, WORD },
|
---|
278 | { "movsb", MOVS, BYTE },
|
---|
279 | { "movsbl", MOVSXB, WORD },
|
---|
280 | { "movsbw", MOVSXB, OWORD },
|
---|
281 | { "movsl", MOVS, WORD },
|
---|
282 | { "movsw", MOVS, OWORD },
|
---|
283 | { "movswl", MOVSX, WORD },
|
---|
284 | { "movw", MOV, OWORD },
|
---|
285 | { "movzbl", MOVZXB, WORD },
|
---|
286 | { "movzbw", MOVZXB, OWORD },
|
---|
287 | { "movzwl", MOVZX, WORD },
|
---|
288 | { "mulb", MUL, BYTE },
|
---|
289 | { "mull", MUL, WORD },
|
---|
290 | { "mulw", MUL, OWORD },
|
---|
291 | { "negb", NEG, BYTE },
|
---|
292 | { "negl", NEG, WORD },
|
---|
293 | { "negw", NEG, OWORD },
|
---|
294 | { "nop", NOP, WORD },
|
---|
295 | { "notb", NOT, BYTE },
|
---|
296 | { "notl", NOT, WORD },
|
---|
297 | { "notw", NOT, OWORD },
|
---|
298 | { "orb", OR, BYTE },
|
---|
299 | { "orl", OR, WORD },
|
---|
300 | { "orw", OR, OWORD },
|
---|
301 | { "outb", OUT, BYTE },
|
---|
302 | { "outl", OUT, WORD },
|
---|
303 | { "outsb", OUTS, BYTE },
|
---|
304 | { "outsl", OUTS, WORD },
|
---|
305 | { "outsw", OUTS, OWORD },
|
---|
306 | { "outw", OUT, OWORD },
|
---|
307 | { "pop", POP, WORD },
|
---|
308 | { "popa", POPA, WORD },
|
---|
309 | { "popad", POPA, WORD },
|
---|
310 | { "popf", POPF, WORD },
|
---|
311 | { "popl", POP, WORD },
|
---|
312 | { "push", PUSH, WORD },
|
---|
313 | { "pusha", PUSHA, WORD },
|
---|
314 | { "pushad", PUSHA, WORD },
|
---|
315 | { "pushf", PUSHF, WORD },
|
---|
316 | { "pushl", PUSH, WORD },
|
---|
317 | { "rclb", RCL, BYTE },
|
---|
318 | { "rcll", RCL, WORD },
|
---|
319 | { "rclw", RCL, OWORD },
|
---|
320 | { "rcrb", RCR, BYTE },
|
---|
321 | { "rcrl", RCR, WORD },
|
---|
322 | { "rcrw", RCR, OWORD },
|
---|
323 | { "ret", RET, JUMP },
|
---|
324 | { "retf", RETF, JUMP },
|
---|
325 | { "rolb", ROL, BYTE },
|
---|
326 | { "roll", ROL, WORD },
|
---|
327 | { "rolw", ROL, OWORD },
|
---|
328 | { "rorb", ROR, BYTE },
|
---|
329 | { "rorl", ROR, WORD },
|
---|
330 | { "rorw", ROR, OWORD },
|
---|
331 | { "sahf", SAHF, WORD },
|
---|
332 | { "salb", SAL, BYTE },
|
---|
333 | { "sall", SAL, WORD },
|
---|
334 | { "salw", SAL, OWORD },
|
---|
335 | { "sarb", SAR, BYTE },
|
---|
336 | { "sarl", SAR, WORD },
|
---|
337 | { "sarw", SAR, OWORD },
|
---|
338 | { "sbbb", SBB, BYTE },
|
---|
339 | { "sbbl", SBB, WORD },
|
---|
340 | { "sbbw", SBB, OWORD },
|
---|
341 | { "scasb", SCAS, BYTE },
|
---|
342 | { "scasl", SCAS, WORD },
|
---|
343 | { "scasw", SCAS, OWORD },
|
---|
344 | { "seta", SETA, BYTE },
|
---|
345 | { "setae", SETAE, BYTE },
|
---|
346 | { "setb", SETB, BYTE },
|
---|
347 | { "setbe", SETBE, BYTE },
|
---|
348 | { "sete", SETE, BYTE },
|
---|
349 | { "setg", SETG, BYTE },
|
---|
350 | { "setge", SETGE, BYTE },
|
---|
351 | { "setl", SETL, BYTE },
|
---|
352 | { "setna", SETBE, BYTE },
|
---|
353 | { "setnae", SETB, BYTE },
|
---|
354 | { "setnb", SETAE, BYTE },
|
---|
355 | { "setnbe", SETA, BYTE },
|
---|
356 | { "setne", SETNE, BYTE },
|
---|
357 | { "setng", SETLE, BYTE },
|
---|
358 | { "setnge", SETL, BYTE },
|
---|
359 | { "setnl", SETGE, BYTE },
|
---|
360 | { "setnle", SETG, BYTE },
|
---|
361 | { "setno", SETNO, BYTE },
|
---|
362 | { "setnp", SETNP, BYTE },
|
---|
363 | { "setns", SETNS, BYTE },
|
---|
364 | { "seto", SETO, BYTE },
|
---|
365 | { "setp", SETP, BYTE },
|
---|
366 | { "sets", SETS, BYTE },
|
---|
367 | { "setz", SETE, BYTE },
|
---|
368 | { "sgdt", SGDT, WORD },
|
---|
369 | { "shlb", SHL, BYTE },
|
---|
370 | { "shldl", SHLD, WORD },
|
---|
371 | { "shll", SHL, WORD },
|
---|
372 | { "shlw", SHL, OWORD },
|
---|
373 | { "shrb", SHR, BYTE },
|
---|
374 | { "shrdl", SHRD, WORD },
|
---|
375 | { "shrl", SHR, WORD },
|
---|
376 | { "shrw", SHR, OWORD },
|
---|
377 | { "sidt", SIDT, WORD },
|
---|
378 | { "sldt", SLDT, WORD },
|
---|
379 | { "smsw", SMSW, WORD },
|
---|
380 | { "stc", STC, WORD },
|
---|
381 | { "std", STD, WORD },
|
---|
382 | { "sti", STI, WORD },
|
---|
383 | { "stosb", STOS, BYTE },
|
---|
384 | { "stosl", STOS, WORD },
|
---|
385 | { "stosw", STOS, OWORD },
|
---|
386 | { "str", STR, WORD },
|
---|
387 | { "subb", SUB, BYTE },
|
---|
388 | { "subl", SUB, WORD },
|
---|
389 | { "subw", SUB, OWORD },
|
---|
390 | { "testb", TEST, BYTE },
|
---|
391 | { "testl", TEST, WORD },
|
---|
392 | { "testw", TEST, OWORD },
|
---|
393 | { "verr", VERR, WORD },
|
---|
394 | { "verw", VERW, WORD },
|
---|
395 | { "wait", WAIT, WORD },
|
---|
396 | { "wbinvd", WBINVD, WORD },
|
---|
397 | { "xadd", XADD, WORD },
|
---|
398 | { "xchgb", XCHG, BYTE },
|
---|
399 | { "xchgl", XCHG, WORD },
|
---|
400 | { "xchgw", XCHG, OWORD },
|
---|
401 | { "xlat", XLAT, WORD },
|
---|
402 | { "xorb", XOR, BYTE },
|
---|
403 | { "xorl", XOR, WORD },
|
---|
404 | { "xorw", XOR, OWORD },
|
---|
405 | };
|
---|
406 |
|
---|
void gnu_parse_init(char *file)
/* Get ready to parse a GNU assembly file: start the tokenizer on 'file'. */
{
	/* '#' is the second tok_init() argument; presumably the character the
	 * tokenizer treats as the start of a comment -- confirm in tok_init().
	 */
	tok_init(file, '#');
}
|
---|
412 |
|
---|
413 | static void zap(void)
|
---|
414 | /* An error, zap the rest of the line. */
|
---|
415 | {
|
---|
416 | token_t *t;
|
---|
417 |
|
---|
418 | while ((t= get_token(0))->type != T_EOF && t->symbol != ';')
|
---|
419 | skip_token(1);
|
---|
420 | }
|
---|
421 |
|
---|
422 | static mnemonic_t *search_mnem(char *name)
|
---|
423 | /* Binary search for a mnemonic. (That's why the table is sorted.) */
|
---|
424 | {
|
---|
425 | int low, mid, high;
|
---|
426 | int cmp;
|
---|
427 | mnemonic_t *m;
|
---|
428 |
|
---|
429 | low= 0;
|
---|
430 | high= arraysize(mnemtab)-1;
|
---|
431 | while (low <= high) {
|
---|
432 | mid= (low + high) / 2;
|
---|
433 | m= &mnemtab[mid];
|
---|
434 |
|
---|
435 | if ((cmp= strcmp(name, m->name)) == 0) return m;
|
---|
436 |
|
---|
437 | if (cmp < 0) high= mid-1; else low= mid+1;
|
---|
438 | }
|
---|
439 | return nil;
|
---|
440 | }
|
---|
441 |
|
---|
442 | static expression_t *gnu_get_C_expression(int *pn)
|
---|
443 | /* Read a "C-like" expression. Note that we don't worry about precedence,
|
---|
444 | * the expression is printed later like it is read. If the target language
|
---|
445 | * does not have all the operators (like ~) then this has to be repaired by
|
---|
446 | * changing the source file. (No problem, you still have one source file
|
---|
447 | * to maintain, not two.)
|
---|
448 | */
|
---|
449 | {
|
---|
450 | expression_t *e, *a1, *a2;
|
---|
451 | token_t *t;
|
---|
452 |
|
---|
453 | if ((t= get_token(*pn))->symbol == '(') {
|
---|
454 | /* ( expr ): grouping. */
|
---|
455 | (*pn)++;
|
---|
456 | if ((a1= gnu_get_C_expression(pn)) == nil) return nil;
|
---|
457 | if (get_token(*pn)->symbol != ')') {
|
---|
458 | parse_err(1, t, "missing )\n");
|
---|
459 | del_expr(a1);
|
---|
460 | return nil;
|
---|
461 | }
|
---|
462 | (*pn)++;
|
---|
463 | e= new_expr();
|
---|
464 | e->operator= '[';
|
---|
465 | e->middle= a1;
|
---|
466 | } else
|
---|
467 | if (t->type == T_WORD || t->type == T_STRING) {
|
---|
468 | /* Label, number, or string. */
|
---|
469 | e= new_expr();
|
---|
470 | e->operator= t->type == T_WORD ? 'W' : 'S';
|
---|
471 | e->name= allocate(nil, (t->len+1) * sizeof(e->name[0]));
|
---|
472 | memcpy(e->name, t->name , t->len+1);
|
---|
473 | e->len= t->len;
|
---|
474 | (*pn)++;
|
---|
475 | } else
|
---|
476 | if (t->symbol == '+' || t->symbol == '-' || t->symbol == '~') {
|
---|
477 | /* Unary operator. */
|
---|
478 | (*pn)++;
|
---|
479 | if ((a1= gnu_get_C_expression(pn)) == nil) return nil;
|
---|
480 | e= new_expr();
|
---|
481 | e->operator= t->symbol;
|
---|
482 | e->middle= a1;
|
---|
483 | } else {
|
---|
484 | parse_err(1, t, "expression syntax error\n");
|
---|
485 | return nil;
|
---|
486 | }
|
---|
487 |
|
---|
488 | switch ((t= get_token(*pn))->symbol) {
|
---|
489 | case '%':
|
---|
490 | case '+':
|
---|
491 | case '-':
|
---|
492 | case '*':
|
---|
493 | case '/':
|
---|
494 | case '&':
|
---|
495 | case '|':
|
---|
496 | case '^':
|
---|
497 | case S_LEFTSHIFT:
|
---|
498 | case S_RIGHTSHIFT:
|
---|
499 | (*pn)++;
|
---|
500 | a1= e;
|
---|
501 | if ((a2= gnu_get_C_expression(pn)) == nil) {
|
---|
502 | del_expr(a1);
|
---|
503 | return nil;
|
---|
504 | }
|
---|
505 | e= new_expr();
|
---|
506 | e->operator= t->symbol;
|
---|
507 | e->left= a1;
|
---|
508 | e->right= a2;
|
---|
509 | }
|
---|
510 | return e;
|
---|
511 | }
|
---|
512 |
|
---|
513 | static expression_t *gnu_get_operand(int *pn, int deref)
|
---|
514 | /* Get something like: $immed, memory, offset(%base,%index,scale), or simpler. */
|
---|
515 | {
|
---|
516 | expression_t *e, *offset, *base, *index;
|
---|
517 | token_t *t;
|
---|
518 | int c;
|
---|
519 |
|
---|
520 | if (get_token(*pn)->symbol == '$') {
|
---|
521 | /* An immediate value. */
|
---|
522 | (*pn)++;
|
---|
523 | return gnu_get_C_expression(pn);
|
---|
524 | }
|
---|
525 |
|
---|
526 | if (get_token(*pn)->symbol == '*') {
|
---|
527 | /* Indirection. */
|
---|
528 | (*pn)++;
|
---|
529 | if ((offset= gnu_get_operand(pn, deref)) == nil) return nil;
|
---|
530 | e= new_expr();
|
---|
531 | e->operator= '(';
|
---|
532 | e->middle= offset;
|
---|
533 | return e;
|
---|
534 | }
|
---|
535 |
|
---|
536 | if ((get_token(*pn)->symbol == '%')
|
---|
537 | && (t= get_token(*pn + 1))->type == T_WORD
|
---|
538 | && isregister(t->name)
|
---|
539 | ) {
|
---|
540 | /* A register operand. */
|
---|
541 | (*pn)+= 2;
|
---|
542 | e= new_expr();
|
---|
543 | e->operator= 'W';
|
---|
544 | e->name= copystr(t->name);
|
---|
545 | return e;
|
---|
546 | }
|
---|
547 |
|
---|
548 | /* Offset? */
|
---|
549 | if (get_token(*pn)->symbol != '('
|
---|
550 | || get_token(*pn + 1)->symbol != '%') {
|
---|
551 | /* There is an offset. */
|
---|
552 | if ((offset= gnu_get_C_expression(pn)) == nil) return nil;
|
---|
553 | } else {
|
---|
554 | /* No offset. */
|
---|
555 | offset= nil;
|
---|
556 | }
|
---|
557 |
|
---|
558 | /* (%base,%index,scale) ? */
|
---|
559 | base= index= nil;
|
---|
560 | if (get_token(*pn)->symbol == '(') {
|
---|
561 | (*pn)++;
|
---|
562 |
|
---|
563 | /* %base ? */
|
---|
564 | if (get_token(*pn)->symbol == '%'
|
---|
565 | && (t= get_token(*pn + 1))->type == T_WORD
|
---|
566 | && isregister(t->name)
|
---|
567 | ) {
|
---|
568 | /* A base register expression. */
|
---|
569 | base= new_expr();
|
---|
570 | base->operator= 'B';
|
---|
571 | base->name= copystr(t->name);
|
---|
572 | (*pn)+= 2;
|
---|
573 | }
|
---|
574 |
|
---|
575 | if (get_token(*pn)->symbol == ',') (*pn)++;
|
---|
576 |
|
---|
577 | /* %index ? */
|
---|
578 | if (get_token(*pn)->symbol == '%'
|
---|
579 | && (t= get_token(*pn + 1))->type == T_WORD
|
---|
580 | && isregister(t->name)
|
---|
581 | ) {
|
---|
582 | /* A index register expression. */
|
---|
583 | index= new_expr();
|
---|
584 | index->operator= '1'; /* for now */
|
---|
585 | index->name= copystr(t->name);
|
---|
586 | (*pn)+= 2;
|
---|
587 | }
|
---|
588 |
|
---|
589 | if (get_token(*pn)->symbol == ',') (*pn)++;
|
---|
590 |
|
---|
591 | /* scale ? */
|
---|
592 | if ((base != nil || index != nil)
|
---|
593 | && (t= get_token(*pn))->type == T_WORD
|
---|
594 | && strchr("1248", t->name[0]) != nil
|
---|
595 | && t->name[1] == 0
|
---|
596 | ) {
|
---|
597 | if (index == nil) {
|
---|
598 | /* Base is really an index register. */
|
---|
599 | index= base;
|
---|
600 | base= nil;
|
---|
601 | }
|
---|
602 | index->operator= t->name[0];
|
---|
603 | (*pn)++;
|
---|
604 | }
|
---|
605 |
|
---|
606 | if (get_token(*pn)->symbol == ')') {
|
---|
607 | /* Ending paren. */
|
---|
608 | (*pn)++;
|
---|
609 | } else {
|
---|
610 | /* Alas. */
|
---|
611 | parse_err(1, t, "operand syntax error\n");
|
---|
612 | del_expr(offset);
|
---|
613 | del_expr(base);
|
---|
614 | del_expr(index);
|
---|
615 | return nil;
|
---|
616 | }
|
---|
617 | }
|
---|
618 |
|
---|
619 | if (base == nil && index == nil) {
|
---|
620 | if (deref) {
|
---|
621 | /* Return a lone offset as (offset). */
|
---|
622 | e= new_expr();
|
---|
623 | e->operator= '(';
|
---|
624 | e->middle= offset;
|
---|
625 | } else {
|
---|
626 | /* Return a lone offset as is. */
|
---|
627 | e= offset;
|
---|
628 | }
|
---|
629 | } else {
|
---|
630 | e= new_expr();
|
---|
631 | e->operator= 'O';
|
---|
632 | e->left= offset;
|
---|
633 |
|
---|
634 | e->middle= base;
|
---|
635 | e->right= index;
|
---|
636 | }
|
---|
637 | return e;
|
---|
638 | }
|
---|
639 |
|
---|
640 | static expression_t *gnu_get_oplist(int *pn, int deref)
|
---|
641 | /* Get a comma (or colon for jmpf and callf) separated list of instruction
|
---|
642 | * operands.
|
---|
643 | */
|
---|
644 | {
|
---|
645 | expression_t *e, *o1, *o2;
|
---|
646 | token_t *t;
|
---|
647 |
|
---|
648 | if ((e= gnu_get_operand(pn, deref)) == nil) return nil;
|
---|
649 |
|
---|
650 | if ((t= get_token(*pn))->symbol == ',' || t->symbol == ':') {
|
---|
651 | o1= e;
|
---|
652 | (*pn)++;
|
---|
653 | if ((o2= gnu_get_oplist(pn, deref)) == nil) {
|
---|
654 | del_expr(o1);
|
---|
655 | return nil;
|
---|
656 | }
|
---|
657 | e= new_expr();
|
---|
658 | e->operator= ',';
|
---|
659 | e->left= o1;
|
---|
660 | e->right= o2;
|
---|
661 | }
|
---|
662 | return e;
|
---|
663 | }
|
---|
664 |
|
---|
665 |
|
---|
666 | static asm86_t *gnu_get_statement(void)
|
---|
667 | /* Get a pseudo op or machine instruction with arguments. */
|
---|
668 | {
|
---|
669 | token_t *t= get_token(0);
|
---|
670 | asm86_t *a;
|
---|
671 | mnemonic_t *m;
|
---|
672 | int n;
|
---|
673 | int prefix_seen;
|
---|
674 | int deref;
|
---|
675 |
|
---|
676 | assert(t->type == T_WORD);
|
---|
677 |
|
---|
678 | a= new_asm86();
|
---|
679 |
|
---|
680 | /* Process instruction prefixes. */
|
---|
681 | for (prefix_seen= 0;; prefix_seen= 1) {
|
---|
682 | if (strcmp(t->name, "rep") == 0
|
---|
683 | || strcmp(t->name, "repe") == 0
|
---|
684 | || strcmp(t->name, "repne") == 0
|
---|
685 | || strcmp(t->name, "repz") == 0
|
---|
686 | || strcmp(t->name, "repnz") == 0
|
---|
687 | ) {
|
---|
688 | if (a->rep != ONCE) {
|
---|
689 | parse_err(1, t,
|
---|
690 | "can't have more than one rep\n");
|
---|
691 | }
|
---|
692 | switch (t->name[3]) {
|
---|
693 | case 0: a->rep= REP; break;
|
---|
694 | case 'e':
|
---|
695 | case 'z': a->rep= REPE; break;
|
---|
696 | case 'n': a->rep= REPNE; break;
|
---|
697 | }
|
---|
698 | } else
|
---|
699 | if (!prefix_seen) {
|
---|
700 | /* No prefix here, get out! */
|
---|
701 | break;
|
---|
702 | } else {
|
---|
703 | /* No more prefixes, next must be an instruction. */
|
---|
704 | if (t->type != T_WORD
|
---|
705 | || (m= search_mnem(t->name)) == nil
|
---|
706 | || m->optype == PSEUDO
|
---|
707 | ) {
|
---|
708 | parse_err(1, t,
|
---|
709 | "machine instruction expected after instruction prefix\n");
|
---|
710 | del_asm86(a);
|
---|
711 | return nil;
|
---|
712 | }
|
---|
713 | break;
|
---|
714 | }
|
---|
715 |
|
---|
716 | /* Skip the prefix and extra newlines. */
|
---|
717 | do {
|
---|
718 | skip_token(1);
|
---|
719 | } while ((t= get_token(0))->symbol == ';');
|
---|
720 | }
|
---|
721 |
|
---|
722 | /* All the readahead being done upsets the line counter. */
|
---|
723 | a->line= t->line;
|
---|
724 |
|
---|
725 | /* Read a machine instruction or pseudo op. */
|
---|
726 | if ((m= search_mnem(t->name)) == nil) {
|
---|
727 | parse_err(1, t, "unknown instruction '%s'\n", t->name);
|
---|
728 | del_asm86(a);
|
---|
729 | return nil;
|
---|
730 | }
|
---|
731 | a->opcode= m->opcode;
|
---|
732 | a->optype= m->optype;
|
---|
733 | a->oaz= 0;
|
---|
734 | if (a->optype == OWORD) {
|
---|
735 | a->oaz|= OPZ;
|
---|
736 | a->optype= WORD;
|
---|
737 | }
|
---|
738 |
|
---|
739 | switch (a->opcode) {
|
---|
740 | case IN:
|
---|
741 | case OUT:
|
---|
742 | case INT:
|
---|
743 | deref= 0;
|
---|
744 | break;
|
---|
745 | default:
|
---|
746 | deref= (a->optype >= BYTE);
|
---|
747 | }
|
---|
748 | n= 1;
|
---|
749 | if (get_token(1)->symbol != ';'
|
---|
750 | && (a->args= gnu_get_oplist(&n, deref)) == nil) {
|
---|
751 | del_asm86(a);
|
---|
752 | return nil;
|
---|
753 | }
|
---|
754 | if (get_token(n)->symbol != ';') {
|
---|
755 | parse_err(1, t, "garbage at end of instruction\n");
|
---|
756 | del_asm86(a);
|
---|
757 | return nil;
|
---|
758 | }
|
---|
759 | if (!is_pseudo(a->opcode)) {
|
---|
760 | /* GNU operand order is the other way around. */
|
---|
761 | expression_t *e, *t;
|
---|
762 |
|
---|
763 | e= a->args;
|
---|
764 | while (e != nil && e->operator == ',') {
|
---|
765 | t= e->right; e->right= e->left; e->left= t;
|
---|
766 | e= e->left;
|
---|
767 | }
|
---|
768 | }
|
---|
769 | switch (a->opcode) {
|
---|
770 | case DOT_ALIGN:
|
---|
771 | /* Delete two argument .align, because ACK can't do it.
|
---|
772 | * Raise 2 to the power of .align's argument.
|
---|
773 | */
|
---|
774 | if (a->args == nil || a->args->operator != 'W') {
|
---|
775 | del_asm86(a);
|
---|
776 | return nil;
|
---|
777 | }
|
---|
778 | if (a->args != nil && a->args->operator == 'W'
|
---|
779 | && isanumber(a->args->name)
|
---|
780 | ) {
|
---|
781 | unsigned n;
|
---|
782 | char num[sizeof(int) * CHAR_BIT / 3 + 1];
|
---|
783 |
|
---|
784 | n= 1 << strtoul(a->args->name, nil, 0);
|
---|
785 | sprintf(num, "%u", n);
|
---|
786 | deallocate(a->args->name);
|
---|
787 | a->args->name= copystr(num);
|
---|
788 | }
|
---|
789 | break;
|
---|
790 | case JMPF:
|
---|
791 | case CALLF:
|
---|
792 | /*FALL THROUGH*/
|
---|
793 | case JMP:
|
---|
794 | case CALL:
|
---|
795 | break;
|
---|
796 | default:;
|
---|
797 | }
|
---|
798 | skip_token(n+1);
|
---|
799 | return a;
|
---|
800 | }
|
---|
801 |
|
---|
802 |
|
---|
803 | asm86_t *gnu_get_instruction(void)
|
---|
804 | {
|
---|
805 | asm86_t *a= nil;
|
---|
806 | expression_t *e;
|
---|
807 | token_t *t;
|
---|
808 |
|
---|
809 | while ((t= get_token(0))->symbol == ';' || t->symbol == '/') {
|
---|
810 | zap(); /* if a comment started by a '/' */
|
---|
811 | skip_token(1);
|
---|
812 | }
|
---|
813 |
|
---|
814 | if (t->type == T_EOF) return nil;
|
---|
815 |
|
---|
816 | if (t->symbol == '#') {
|
---|
817 | /* Preprocessor line and file change. */
|
---|
818 |
|
---|
819 | if ((t= get_token(1))->type != T_WORD || !isanumber(t->name)
|
---|
820 | || get_token(2)->type != T_STRING
|
---|
821 | ) {
|
---|
822 | parse_err(1, t, "file not preprocessed?\n");
|
---|
823 | zap();
|
---|
824 | } else {
|
---|
825 | set_file(get_token(2)->name,
|
---|
826 | strtol(get_token(1)->name, nil, 0) - 1);
|
---|
827 |
|
---|
828 | /* GNU CPP adds extra cruft, simply zap the line. */
|
---|
829 | zap();
|
---|
830 | }
|
---|
831 | a= gnu_get_instruction();
|
---|
832 | } else
|
---|
833 | if (t->type == T_WORD && get_token(1)->symbol == ':') {
|
---|
834 | /* A label definition. */
|
---|
835 |
|
---|
836 | a= new_asm86();
|
---|
837 | a->line= t->line;
|
---|
838 | a->opcode= DOT_LABEL;
|
---|
839 | a->optype= PSEUDO;
|
---|
840 | a->args= e= new_expr();
|
---|
841 | e->operator= ':';
|
---|
842 | e->name= copystr(t->name);
|
---|
843 | skip_token(2);
|
---|
844 | } else
|
---|
845 | if (t->type == T_WORD && get_token(1)->symbol == '=') {
|
---|
846 | int n= 2;
|
---|
847 |
|
---|
848 | if ((e= gnu_get_C_expression(&n)) == nil) {
|
---|
849 | zap();
|
---|
850 | a= gnu_get_instruction();
|
---|
851 | } else
|
---|
852 | if (get_token(n)->symbol != ';') {
|
---|
853 | parse_err(1, t, "garbage after assignment\n");
|
---|
854 | zap();
|
---|
855 | a= gnu_get_instruction();
|
---|
856 | } else {
|
---|
857 | a= new_asm86();
|
---|
858 | a->line= t->line;
|
---|
859 | a->opcode= DOT_EQU;
|
---|
860 | a->optype= PSEUDO;
|
---|
861 | a->args= new_expr();
|
---|
862 | a->args->operator= '=';
|
---|
863 | a->args->name= copystr(t->name);
|
---|
864 | a->args->middle= e;
|
---|
865 | skip_token(n+1);
|
---|
866 | }
|
---|
867 | } else
|
---|
868 | if (t->type == T_WORD) {
|
---|
869 | if ((a= gnu_get_statement()) == nil) {
|
---|
870 | zap();
|
---|
871 | a= gnu_get_instruction();
|
---|
872 | }
|
---|
873 | } else {
|
---|
874 | parse_err(1, t, "syntax error\n");
|
---|
875 | zap();
|
---|
876 | a= gnu_get_instruction();
|
---|
877 | }
|
---|
878 | return a;
|
---|
879 | }
|
---|