]>
Commit | Line | Data |
---|---|---|
fecd2382 | 1 | /* expr.c -operands, expressions- |
f2f7d044 | 2 | Copyright (C) 1987, 1990, 1991, 1992, 1993 Free Software Foundation, Inc. |
2ed83a59 | 3 | |
a39116f1 | 4 | This file is part of GAS, the GNU Assembler. |
2ed83a59 | 5 | |
a39116f1 RP |
6 | GAS is free software; you can redistribute it and/or modify |
7 | it under the terms of the GNU General Public License as published by | |
8 | the Free Software Foundation; either version 2, or (at your option) | |
9 | any later version. | |
2ed83a59 | 10 | |
a39116f1 RP |
11 | GAS is distributed in the hope that it will be useful, |
12 | but WITHOUT ANY WARRANTY; without even the implied warranty of | |
13 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
14 | GNU General Public License for more details. | |
2ed83a59 | 15 | |
a39116f1 RP |
16 | You should have received a copy of the GNU General Public License |
17 | along with GAS; see the file COPYING. If not, write to | |
18 | the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA. */ | |
fecd2382 RP |
19 | |
20 | /* | |
21 | * This is really a branch office of as-read.c. I split it out to clearly | |
22 | * distinguish the world of expressions from the world of statements. | |
23 | * (It also gives smaller files to re-compile.) | |
24 | * Here, "operand"s are of expressions, not instructions. | |
25 | */ | |
26 | ||
27 | #include <ctype.h> | |
28 | #include <string.h> | |
29 | ||
30 | #include "as.h" | |
31 | ||
32 | #include "obstack.h" | |
33 | ||
d4c8cbd8 JL |
34 | static void floating_constant PARAMS ((expressionS * expressionP)); |
35 | static void integer_constant PARAMS ((int radix, expressionS * expressionP)); | |
f2f7d044 | 36 | static void clean_up_expression PARAMS ((expressionS * expressionP)); |
5ac34ac3 ILT |
37 | static symbolS *make_expr_symbol PARAMS ((expressionS * expressionP)); |
38 | ||
f2f7d044 | 39 | extern const char EXP_CHARS[], FLT_CHARS[]; |
5ac34ac3 ILT |
40 | \f |
41 | /* Build a dummy symbol to hold a complex expression. This is how we | |
42 | build expressions up out of other expressions. The symbol is put | |
43 | into the fake section expr_section. */ | |
44 | ||
45 | static symbolS * | |
46 | make_expr_symbol (expressionP) | |
47 | expressionS *expressionP; | |
48 | { | |
49 | const char *fake; | |
50 | symbolS *symbolP; | |
fecd2382 | 51 | |
5ac34ac3 ILT |
52 | /* FIXME: This should be something which decode_local_label_name |
53 | will handle. */ | |
d4c8cbd8 JL |
54 | fake = FAKE_LABEL_NAME; |
55 | ||
5ac34ac3 ILT |
56 | /* Putting constant symbols in absolute_section rather than |
57 | expr_section is convenient for the old a.out code, for which | |
58 | S_GET_SEGMENT does not always retrieve the value put in by | |
59 | S_SET_SEGMENT. */ | |
60 | symbolP = symbol_new (fake, | |
61 | (expressionP->X_op == O_constant | |
62 | ? absolute_section | |
63 | : expr_section), | |
64 | 0, &zero_address_frag); | |
65 | symbolP->sy_value = *expressionP; | |
66 | return symbolP; | |
67 | } | |
68 | \f | |
fecd2382 RP |
69 | /* |
70 | * Build any floating-point literal here. | |
71 | * Also build any bignum literal here. | |
72 | */ | |
73 | ||
fecd2382 RP |
74 | /* Seems atof_machine can backscan through generic_bignum and hit whatever |
75 | happens to be loaded before it in memory. And its way too complicated | |
76 | for me to fix right. Thus a hack. JF: Just make generic_bignum bigger, | |
77 | and never write into the early words, thus they'll always be zero. | |
f2f7d044 | 78 | I hate Dean's floating-point code. Bleh. */ |
2ed83a59 KR |
79 | LITTLENUM_TYPE generic_bignum[SIZE_OF_LARGE_NUMBER + 6]; |
80 | FLONUM_TYPE generic_floating_point_number = | |
fecd2382 | 81 | { |
2ed83a59 | 82 | &generic_bignum[6], /* low (JF: Was 0) */ |
351878df | 83 | &generic_bignum[SIZE_OF_LARGE_NUMBER + 6 - 1], /* high JF: (added +6) */ |
2ed83a59 KR |
84 | 0, /* leader */ |
85 | 0, /* exponent */ | |
86 | 0 /* sign */ | |
87 | }; | |
fecd2382 RP |
88 | /* If nonzero, we've been asked to assemble nan, +inf or -inf */ |
89 | int generic_floating_point_magic; | |
90 | \f | |
d4c8cbd8 | 91 | static void |
2ed83a59 KR |
92 | floating_constant (expressionP) |
93 | expressionS *expressionP; | |
c593cf41 SC |
94 | { |
95 | /* input_line_pointer->*/ | |
96 | /* floating-point constant. */ | |
97 | int error_code; | |
98 | ||
351878df KR |
99 | error_code = atof_generic (&input_line_pointer, ".", EXP_CHARS, |
100 | &generic_floating_point_number); | |
c593cf41 SC |
101 | |
102 | if (error_code) | |
c593cf41 | 103 | { |
2ed83a59 KR |
104 | if (error_code == ERROR_EXPONENT_OVERFLOW) |
105 | { | |
106 | as_bad ("bad floating-point constant: exponent overflow, probably assembling junk"); | |
107 | } | |
108 | else | |
109 | { | |
110 | as_bad ("bad floating-point constant: unknown error code=%d.", error_code); | |
111 | } | |
c593cf41 | 112 | } |
5ac34ac3 | 113 | expressionP->X_op = O_big; |
c593cf41 SC |
114 | /* input_line_pointer->just after constant, */ |
115 | /* which may point to whitespace. */ | |
2ed83a59 | 116 | expressionP->X_add_number = -1; |
c593cf41 SC |
117 | } |
118 | ||
d4c8cbd8 | 119 | static void |
2ed83a59 KR |
120 | integer_constant (radix, expressionP) |
121 | int radix; | |
122 | expressionS *expressionP; | |
c593cf41 | 123 | { |
7691379e | 124 | char *start; /* start of number. */ |
c593cf41 | 125 | char c; |
2ed83a59 | 126 | |
dae92eab KR |
127 | valueT number; /* offset or (absolute) value */ |
128 | short int digit; /* value of next digit in current radix */ | |
129 | short int maxdig = 0;/* highest permitted digit value. */ | |
130 | int too_many_digits = 0; /* if we see >= this number of */ | |
131 | char *name; /* points to name of symbol */ | |
132 | symbolS *symbolP; /* points to symbol */ | |
2ed83a59 KR |
133 | |
134 | int small; /* true if fits in 32 bits. */ | |
f2f7d044 | 135 | extern const char hex_value[]; /* in hex_value.c */ |
2ed83a59 | 136 | |
dae92eab KR |
137 | /* May be bignum, or may fit in 32 bits. */ |
138 | /* Most numbers fit into 32 bits, and we want this case to be fast. | |
139 | so we pretend it will fit into 32 bits. If, after making up a 32 | |
140 | bit number, we realise that we have scanned more digits than | |
141 | comfortably fit into 32 bits, we re-scan the digits coding them | |
142 | into a bignum. For decimal and octal numbers we are | |
143 | conservative: Some numbers may be assumed bignums when in fact | |
144 | they do fit into 32 bits. Numbers of any radix can have excess | |
145 | leading zeros: We strive to recognise this and cast them back | |
146 | into 32 bits. We must check that the bignum really is more than | |
147 | 32 bits, and change it back to a 32-bit number if it fits. The | |
148 | number we are looking for is expected to be positive, but if it | |
149 | fits into 32 bits as an unsigned number, we let it be a 32-bit | |
150 | number. The cavalier approach is for speed in ordinary cases. */ | |
58d4951d ILT |
151 | /* This has been extended for 64 bits. We blindly assume that if |
152 | you're compiling in 64-bit mode, the target is a 64-bit machine. | |
153 | This should be cleaned up. */ | |
154 | ||
155 | #ifdef BFD64 | |
156 | #define valuesize 64 | |
157 | #else /* includes non-bfd case, mostly */ | |
158 | #define valuesize 32 | |
159 | #endif | |
2ed83a59 KR |
160 | |
161 | switch (radix) | |
f8701a3f | 162 | { |
f8701a3f SC |
163 | case 2: |
164 | maxdig = 2; | |
58d4951d | 165 | too_many_digits = valuesize + 1; |
f8701a3f SC |
166 | break; |
167 | case 8: | |
168 | maxdig = radix = 8; | |
7691379e | 169 | too_many_digits = (valuesize + 2) / 3 + 1; |
f8701a3f SC |
170 | break; |
171 | case 16: | |
f8701a3f | 172 | maxdig = radix = 16; |
7691379e | 173 | too_many_digits = (valuesize + 3) / 4 + 1; |
f8701a3f SC |
174 | break; |
175 | case 10: | |
176 | maxdig = radix = 10; | |
58d4951d | 177 | too_many_digits = (valuesize + 12) / 4; /* very rough */ |
f8701a3f | 178 | } |
58d4951d | 179 | #undef valuesize |
7691379e KR |
180 | start = input_line_pointer; |
181 | c = *input_line_pointer++; | |
58d4951d ILT |
182 | for (number = 0; |
183 | (digit = hex_value[(unsigned char) c]) < maxdig; | |
184 | c = *input_line_pointer++) | |
f8701a3f SC |
185 | { |
186 | number = number * radix + digit; | |
187 | } | |
c593cf41 SC |
188 | /* c contains character after number. */ |
189 | /* input_line_pointer->char after c. */ | |
7691379e | 190 | small = (input_line_pointer - start - 1) < too_many_digits; |
2ed83a59 | 191 | if (!small) |
c593cf41 | 192 | { |
f8701a3f SC |
193 | /* |
194 | * we saw a lot of digits. manufacture a bignum the hard way. | |
195 | */ | |
2ed83a59 KR |
196 | LITTLENUM_TYPE *leader; /*->high order littlenum of the bignum. */ |
197 | LITTLENUM_TYPE *pointer; /*->littlenum we are frobbing now. */ | |
f8701a3f | 198 | long carry; |
2ed83a59 | 199 | |
f8701a3f | 200 | leader = generic_bignum; |
2ed83a59 KR |
201 | generic_bignum[0] = 0; |
202 | generic_bignum[1] = 0; | |
7691379e | 203 | input_line_pointer = start; /*->1st digit. */ |
f8701a3f | 204 | c = *input_line_pointer++; |
58d4951d ILT |
205 | for (; |
206 | (carry = hex_value[(unsigned char) c]) < maxdig; | |
207 | c = *input_line_pointer++) | |
f8701a3f SC |
208 | { |
209 | for (pointer = generic_bignum; | |
210 | pointer <= leader; | |
211 | pointer++) | |
212 | { | |
213 | long work; | |
2ed83a59 KR |
214 | |
215 | work = carry + radix * *pointer; | |
f8701a3f SC |
216 | *pointer = work & LITTLENUM_MASK; |
217 | carry = work >> LITTLENUM_NUMBER_OF_BITS; | |
218 | } | |
219 | if (carry) | |
220 | { | |
221 | if (leader < generic_bignum + SIZE_OF_LARGE_NUMBER - 1) | |
351878df KR |
222 | { |
223 | /* room to grow a longer bignum. */ | |
f8701a3f SC |
224 | *++leader = carry; |
225 | } | |
226 | } | |
227 | } | |
228 | /* again, c is char after number, */ | |
229 | /* input_line_pointer->after c. */ | |
2ed83a59 | 230 | know (LITTLENUM_NUMBER_OF_BITS == 16); |
7691379e | 231 | if (leader < generic_bignum + 2) |
351878df KR |
232 | { |
233 | /* will fit into 32 bits. */ | |
f8701a3f | 234 | number = |
2ed83a59 KR |
235 | ((generic_bignum[1] & LITTLENUM_MASK) << LITTLENUM_NUMBER_OF_BITS) |
236 | | (generic_bignum[0] & LITTLENUM_MASK); | |
f8701a3f SC |
237 | small = 1; |
238 | } | |
239 | else | |
240 | { | |
2ed83a59 | 241 | number = leader - generic_bignum + 1; /* number of littlenums in the bignum. */ |
c593cf41 | 242 | } |
c593cf41 | 243 | } |
2ed83a59 KR |
244 | if (small) |
245 | { | |
f8701a3f | 246 | /* |
2ed83a59 KR |
247 | * here with number, in correct radix. c is the next char. |
248 | * note that unlike un*x, we allow "011f" "0x9f" to | |
249 | * both mean the same as the (conventional) "9f". this is simply easier | |
250 | * than checking for strict canonical form. syntax sux! | |
f8701a3f | 251 | */ |
2ed83a59 KR |
252 | |
253 | switch (c) | |
254 | { | |
255 | ||
256 | #ifdef LOCAL_LABELS_FB | |
257 | case 'b': | |
258 | { | |
259 | /* | |
260 | * backward ref to local label. | |
261 | * because it is backward, expect it to be defined. | |
262 | */ | |
263 | /* Construct a local label. */ | |
264 | name = fb_label_name ((int) number, 0); | |
265 | ||
266 | /* seen before, or symbol is defined: ok */ | |
267 | symbolP = symbol_find (name); | |
268 | if ((symbolP != NULL) && (S_IS_DEFINED (symbolP))) | |
269 | { | |
270 | ||
271 | /* local labels are never absolute. don't waste time | |
272 | checking absoluteness. */ | |
273 | know (SEG_NORMAL (S_GET_SEGMENT (symbolP))); | |
274 | ||
5ac34ac3 | 275 | expressionP->X_op = O_symbol; |
2ed83a59 | 276 | expressionP->X_add_symbol = symbolP; |
2ed83a59 KR |
277 | |
278 | } | |
279 | else | |
dae92eab KR |
280 | { |
281 | /* either not seen or not defined. */ | |
282 | /* @@ Should print out the original string instead of | |
283 | the parsed number. */ | |
284 | as_bad ("backw. ref to unknown label \"%d:\", 0 assumed.", | |
285 | (int) number); | |
5ac34ac3 | 286 | expressionP->X_op = O_constant; |
2ed83a59 KR |
287 | } |
288 | ||
289 | expressionP->X_add_number = 0; | |
290 | break; | |
291 | } /* case 'b' */ | |
292 | ||
293 | case 'f': | |
294 | { | |
295 | /* | |
296 | * forward reference. expect symbol to be undefined or | |
297 | * unknown. undefined: seen it before. unknown: never seen | |
298 | * it before. | |
299 | * construct a local label name, then an undefined symbol. | |
300 | * don't create a xseg frag for it: caller may do that. | |
301 | * just return it as never seen before. | |
302 | */ | |
303 | name = fb_label_name ((int) number, 1); | |
304 | symbolP = symbol_find_or_make (name); | |
305 | /* we have no need to check symbol properties. */ | |
c593cf41 | 306 | #ifndef many_segments |
2ed83a59 KR |
307 | /* since "know" puts its arg into a "string", we |
308 | can't have newlines in the argument. */ | |
f2f7d044 | 309 | know (S_GET_SEGMENT (symbolP) == undefined_section || S_GET_SEGMENT (symbolP) == text_section || S_GET_SEGMENT (symbolP) == data_section); |
c593cf41 | 310 | #endif |
5ac34ac3 | 311 | expressionP->X_op = O_symbol; |
2ed83a59 | 312 | expressionP->X_add_symbol = symbolP; |
2ed83a59 KR |
313 | expressionP->X_add_number = 0; |
314 | ||
315 | break; | |
316 | } /* case 'f' */ | |
317 | ||
f8701a3f | 318 | #endif /* LOCAL_LABELS_FB */ |
2ed83a59 | 319 | |
f8701a3f | 320 | #ifdef LOCAL_LABELS_DOLLAR |
f8701a3f | 321 | |
2ed83a59 KR |
322 | case '$': |
323 | { | |
324 | ||
325 | /* If the dollar label is *currently* defined, then this is just | |
326 | another reference to it. If it is not *currently* defined, | |
327 | then this is a fresh instantiation of that number, so create | |
328 | it. */ | |
329 | ||
d4c8cbd8 | 330 | if (dollar_label_defined ((long) number)) |
2ed83a59 | 331 | { |
d4c8cbd8 | 332 | name = dollar_label_name ((long) number, 0); |
2ed83a59 KR |
333 | symbolP = symbol_find (name); |
334 | know (symbolP != NULL); | |
335 | } | |
336 | else | |
337 | { | |
d4c8cbd8 | 338 | name = dollar_label_name ((long) number, 1); |
2ed83a59 KR |
339 | symbolP = symbol_find_or_make (name); |
340 | } | |
341 | ||
5ac34ac3 | 342 | expressionP->X_op = O_symbol; |
2ed83a59 KR |
343 | expressionP->X_add_symbol = symbolP; |
344 | expressionP->X_add_number = 0; | |
2ed83a59 KR |
345 | |
346 | break; | |
347 | } /* case '$' */ | |
348 | ||
f8701a3f | 349 | #endif /* LOCAL_LABELS_DOLLAR */ |
2ed83a59 KR |
350 | |
351 | default: | |
352 | { | |
5ac34ac3 | 353 | expressionP->X_op = O_constant; |
2ed83a59 | 354 | expressionP->X_add_number = number; |
2ed83a59 KR |
355 | input_line_pointer--; /* restore following character. */ |
356 | break; | |
357 | } /* really just a number */ | |
358 | ||
359 | } /* switch on char following the number */ | |
360 | ||
2ed83a59 KR |
361 | } |
362 | else | |
dae92eab KR |
363 | { |
364 | /* not a small number */ | |
5ac34ac3 | 365 | expressionP->X_op = O_big; |
7691379e | 366 | expressionP->X_add_number = number; /* number of littlenums */ |
2ed83a59 | 367 | input_line_pointer--; /*->char following number. */ |
dae92eab | 368 | } |
d4c8cbd8 | 369 | } |
c593cf41 SC |
370 | |
371 | ||
fecd2382 RP |
372 | /* |
373 | * Summary of operand(). | |
374 | * | |
375 | * in: Input_line_pointer points to 1st char of operand, which may | |
376 | * be a space. | |
377 | * | |
5ac34ac3 ILT |
378 | * out: A expressionS. |
379 | * The operand may have been empty: in this case X_op == O_absent. | |
fecd2382 | 380 | * Input_line_pointer->(next non-blank) char after operand. |
fecd2382 | 381 | */ |
c593cf41 | 382 | |
fecd2382 | 383 | static segT |
c593cf41 | 384 | operand (expressionP) |
dae92eab | 385 | expressionS *expressionP; |
fecd2382 | 386 | { |
dae92eab KR |
387 | char c; |
388 | symbolS *symbolP; /* points to symbol */ | |
389 | char *name; /* points to name of symbol */ | |
58d4951d | 390 | segT segment; |
c593cf41 | 391 | |
d4c8cbd8 JL |
392 | /* All integers are regarded as unsigned unless they are negated. |
393 | This is because the only thing which cares whether a number is | |
394 | unsigned is the code in emit_expr which extends constants into | |
395 | bignums. It should only sign extend negative numbers, so that | |
396 | something like ``.quad 0x80000000'' is not sign extended even | |
397 | though it appears negative if valueT is 32 bits. */ | |
398 | expressionP->X_unsigned = 1; | |
399 | ||
c593cf41 SC |
400 | /* digits, assume it is a bignum. */ |
401 | ||
2ed83a59 KR |
402 | SKIP_WHITESPACE (); /* leading whitespace is part of operand. */ |
403 | c = *input_line_pointer++; /* input_line_pointer->past char in c. */ | |
c593cf41 SC |
404 | |
405 | switch (c) | |
fecd2382 | 406 | { |
2ed83a59 KR |
407 | #ifdef MRI |
408 | case '%': | |
409 | integer_constant (2, expressionP); | |
c593cf41 | 410 | break; |
2ed83a59 KR |
411 | case '@': |
412 | integer_constant (8, expressionP); | |
c593cf41 | 413 | break; |
2ed83a59 KR |
414 | case '$': |
415 | integer_constant (16, expressionP); | |
c593cf41 | 416 | break; |
2ed83a59 | 417 | #endif |
c593cf41 SC |
418 | case '1': |
419 | case '2': | |
420 | case '3': | |
421 | case '4': | |
422 | case '5': | |
423 | case '6': | |
424 | case '7': | |
2ed83a59 KR |
425 | case '8': |
426 | case '9': | |
427 | input_line_pointer--; | |
428 | ||
429 | integer_constant (10, expressionP); | |
c593cf41 SC |
430 | break; |
431 | ||
2ed83a59 KR |
432 | case '0': |
433 | /* non-decimal radix */ | |
434 | ||
2ed83a59 KR |
435 | c = *input_line_pointer; |
436 | switch (c) | |
437 | { | |
438 | ||
439 | default: | |
440 | if (c && strchr (FLT_CHARS, c)) | |
441 | { | |
442 | input_line_pointer++; | |
443 | floating_constant (expressionP); | |
7691379e | 444 | expressionP->X_add_number = -(isupper (c) ? tolower (c) : c); |
2ed83a59 KR |
445 | } |
446 | else | |
447 | { | |
448 | /* The string was only zero */ | |
5ac34ac3 | 449 | expressionP->X_op = O_constant; |
2ed83a59 | 450 | expressionP->X_add_number = 0; |
2ed83a59 KR |
451 | } |
452 | ||
453 | break; | |
454 | ||
455 | case 'x': | |
456 | case 'X': | |
457 | input_line_pointer++; | |
458 | integer_constant (16, expressionP); | |
459 | break; | |
460 | ||
461 | case 'b': | |
462 | #ifdef LOCAL_LABELS_FB | |
7691379e KR |
463 | if (!input_line_pointer[1] |
464 | /* Strictly speaking, we should only need to check for | |
465 | "+-01", since that's all you'd normally have in a | |
466 | binary constant. But some of our code does permit | |
467 | digits greater than the base we're expecting. */ | |
468 | || !strchr ("+-0123456789", input_line_pointer[1])) | |
2ed83a59 KR |
469 | { |
470 | input_line_pointer--; | |
471 | integer_constant (10, expressionP); | |
472 | break; | |
473 | } | |
474 | #endif | |
475 | case 'B': | |
476 | input_line_pointer++; | |
477 | integer_constant (2, expressionP); | |
478 | break; | |
479 | ||
480 | case '0': | |
481 | case '1': | |
482 | case '2': | |
483 | case '3': | |
484 | case '4': | |
485 | case '5': | |
486 | case '6': | |
487 | case '7': | |
488 | integer_constant (8, expressionP); | |
489 | break; | |
490 | ||
491 | case 'f': | |
492 | #ifdef LOCAL_LABELS_FB | |
493 | /* if it says '0f' and the line ends or it doesn't look like | |
d841bc49 | 494 | a floating point #, its a local label ref. dtrt */ |
2ed83a59 KR |
495 | /* likewise for the b's. xoxorich. */ |
496 | if (c == 'f' | |
7691379e KR |
497 | && (!input_line_pointer[1] |
498 | || (!strchr ("+-.0123456789", input_line_pointer[1]) | |
499 | && !strchr (EXP_CHARS, input_line_pointer[1])))) | |
2ed83a59 KR |
500 | { |
501 | input_line_pointer -= 1; | |
502 | integer_constant (10, expressionP); | |
503 | break; | |
504 | } | |
505 | #endif | |
506 | ||
507 | case 'd': | |
508 | case 'D': | |
509 | case 'F': | |
510 | case 'r': | |
511 | case 'e': | |
512 | case 'E': | |
513 | case 'g': | |
514 | case 'G': | |
515 | ||
516 | input_line_pointer++; | |
517 | floating_constant (expressionP); | |
f2f7d044 | 518 | expressionP->X_add_number = -(isupper (c) ? tolower (c) : c); |
2ed83a59 KR |
519 | break; |
520 | ||
521 | #ifdef LOCAL_LABELS_DOLLAR | |
522 | case '$': | |
523 | integer_constant (10, expressionP); | |
524 | break; | |
525 | #endif | |
526 | } | |
527 | ||
c593cf41 | 528 | break; |
5ac34ac3 | 529 | |
2ed83a59 KR |
530 | case '(': |
531 | /* didn't begin with digit & not a name */ | |
58d4951d | 532 | segment = expression (expressionP); |
5ac34ac3 ILT |
533 | /* Expression() will pass trailing whitespace */ |
534 | if (*input_line_pointer++ != ')') | |
535 | { | |
536 | as_bad ("Missing ')' assumed"); | |
537 | input_line_pointer--; | |
538 | } | |
539 | /* here with input_line_pointer->char after "(...)" */ | |
58d4951d | 540 | return segment; |
c593cf41 | 541 | |
2ed83a59 | 542 | case '\'': |
d841bc49 KR |
543 | /* Warning: to conform to other people's assemblers NO ESCAPEMENT is |
544 | permitted for a single quote. The next character, parity errors and | |
545 | all, is taken as the value of the operand. VERY KINKY. */ | |
5ac34ac3 | 546 | expressionP->X_op = O_constant; |
2ed83a59 | 547 | expressionP->X_add_number = *input_line_pointer++; |
2ed83a59 KR |
548 | break; |
549 | ||
49864cfa | 550 | case '+': |
58d4951d | 551 | (void) operand (expressionP); |
49864cfa KR |
552 | break; |
553 | ||
2ed83a59 KR |
554 | case '~': |
555 | case '-': | |
2ed83a59 | 556 | { |
5ac34ac3 ILT |
557 | operand (expressionP); |
558 | if (expressionP->X_op == O_constant) | |
2ed83a59 | 559 | { |
2ed83a59 KR |
560 | /* input_line_pointer -> char after operand */ |
561 | if (c == '-') | |
562 | { | |
5ac34ac3 | 563 | expressionP->X_add_number = - expressionP->X_add_number; |
d841bc49 KR |
564 | /* Notice: '-' may overflow: no warning is given. This is |
565 | compatible with other people's assemblers. Sigh. */ | |
d4c8cbd8 | 566 | expressionP->X_unsigned = 0; |
2ed83a59 KR |
567 | } |
568 | else | |
5ac34ac3 | 569 | expressionP->X_add_number = ~ expressionP->X_add_number; |
f2f7d044 | 570 | } |
5ac34ac3 ILT |
571 | else if (expressionP->X_op != O_illegal |
572 | && expressionP->X_op != O_absent) | |
f2f7d044 | 573 | { |
5ac34ac3 | 574 | expressionP->X_add_symbol = make_expr_symbol (expressionP); |
2ed83a59 | 575 | if (c == '-') |
5ac34ac3 | 576 | expressionP->X_op = O_uminus; |
f2f7d044 | 577 | else |
5ac34ac3 ILT |
578 | expressionP->X_op = O_bit_not; |
579 | expressionP->X_add_number = 0; | |
c593cf41 | 580 | } |
f2f7d044 | 581 | else |
5ac34ac3 ILT |
582 | as_warn ("Unary operator %c ignored because bad operand follows", |
583 | c); | |
c593cf41 | 584 | } |
2ed83a59 KR |
585 | break; |
586 | ||
587 | case '.': | |
588 | if (!is_part_of_name (*input_line_pointer)) | |
589 | { | |
5ac34ac3 | 590 | const char *fake; |
2ed83a59 | 591 | |
85825401 ILT |
592 | /* JF: '.' is pseudo symbol with value of current location |
593 | in current segment. */ | |
d4c8cbd8 | 594 | fake = FAKE_LABEL_NAME; |
85825401 | 595 | symbolP = symbol_new (fake, |
2ed83a59 | 596 | now_seg, |
5ac34ac3 | 597 | (valueT) frag_now_fix (), |
2ed83a59 | 598 | frag_now); |
c593cf41 | 599 | |
5ac34ac3 | 600 | expressionP->X_op = O_symbol; |
2ed83a59 | 601 | expressionP->X_add_symbol = symbolP; |
5ac34ac3 | 602 | expressionP->X_add_number = 0; |
2ed83a59 | 603 | break; |
2ed83a59 KR |
604 | } |
605 | else | |
606 | { | |
607 | goto isname; | |
2ed83a59 KR |
608 | } |
609 | case ',': | |
610 | case '\n': | |
f2f7d044 | 611 | case '\0': |
0bd77bc4 | 612 | eol: |
2ed83a59 | 613 | /* can't imagine any other kind of operand */ |
5ac34ac3 | 614 | expressionP->X_op = O_absent; |
2ed83a59 KR |
615 | input_line_pointer--; |
616 | md_operand (expressionP); | |
617 | break; | |
0bd77bc4 | 618 | |
2ed83a59 | 619 | default: |
58d4951d | 620 | if (is_end_of_line[(unsigned char) c]) |
0bd77bc4 | 621 | goto eol; |
2ed83a59 KR |
622 | if (is_name_beginner (c)) /* here if did not begin with a digit */ |
623 | { | |
624 | /* | |
d841bc49 KR |
625 | * Identifier begins here. |
626 | * This is kludged for speed, so code is repeated. | |
627 | */ | |
2ed83a59 KR |
628 | isname: |
629 | name = --input_line_pointer; | |
630 | c = get_symbol_end (); | |
631 | symbolP = symbol_find_or_make (name); | |
5ac34ac3 ILT |
632 | |
633 | /* If we have an absolute symbol or a reg, then we know its | |
634 | value now. */ | |
58d4951d ILT |
635 | segment = S_GET_SEGMENT (symbolP); |
636 | if (segment == absolute_section) | |
5ac34ac3 ILT |
637 | { |
638 | expressionP->X_op = O_constant; | |
639 | expressionP->X_add_number = S_GET_VALUE (symbolP); | |
640 | } | |
58d4951d | 641 | else if (segment == reg_section) |
5ac34ac3 ILT |
642 | { |
643 | expressionP->X_op = O_register; | |
644 | expressionP->X_add_number = S_GET_VALUE (symbolP); | |
645 | } | |
f2f7d044 | 646 | else |
2ed83a59 | 647 | { |
5ac34ac3 | 648 | expressionP->X_op = O_symbol; |
2ed83a59 | 649 | expressionP->X_add_symbol = symbolP; |
5ac34ac3 | 650 | expressionP->X_add_number = 0; |
2ed83a59 KR |
651 | } |
652 | *input_line_pointer = c; | |
2ed83a59 KR |
653 | } |
654 | else | |
655 | { | |
656 | as_bad ("Bad expression"); | |
5ac34ac3 | 657 | expressionP->X_op = O_constant; |
2ed83a59 | 658 | expressionP->X_add_number = 0; |
2ed83a59 | 659 | } |
c593cf41 | 660 | } |
c593cf41 | 661 | |
c593cf41 SC |
662 | /* |
663 | * It is more 'efficient' to clean up the expressionS when they are created. | |
664 | * Doing it here saves lines of code. | |
665 | */ | |
666 | clean_up_expression (expressionP); | |
2ed83a59 KR |
667 | SKIP_WHITESPACE (); /*->1st char after operand. */ |
668 | know (*input_line_pointer != ' '); | |
58d4951d | 669 | |
009dc5e1 JL |
670 | /* The PA port needs this information. */ |
671 | if (expressionP->X_add_symbol) | |
672 | expressionP->X_add_symbol->sy_used = 1; | |
673 | ||
58d4951d ILT |
674 | switch (expressionP->X_op) |
675 | { | |
676 | default: | |
677 | return absolute_section; | |
678 | case O_symbol: | |
679 | return S_GET_SEGMENT (expressionP->X_add_symbol); | |
680 | case O_register: | |
681 | return reg_section; | |
682 | } | |
2ed83a59 | 683 | } /* operand() */ |
fecd2382 RP |
684 | \f |
685 | /* Internal. Simplify a struct expression for use by expr() */ | |
686 | ||
687 | /* | |
688 | * In: address of a expressionS. | |
5ac34ac3 | 689 | * The X_op field of the expressionS may only take certain values. |
fecd2382 RP |
690 | * Elsewise we waste time special-case testing. Sigh. Ditto SEG_ABSENT. |
691 | * Out: expressionS may have been modified: | |
692 | * 'foo-foo' symbol references cancelled to 0, | |
5ac34ac3 | 693 | * which changes X_op from O_subtract to O_constant. |
fecd2382 RP |
694 | * Unused fields zeroed to help expr(). |
695 | */ | |
696 | ||
697 | static void | |
c593cf41 | 698 | clean_up_expression (expressionP) |
dae92eab | 699 | expressionS *expressionP; |
fecd2382 | 700 | { |
5ac34ac3 | 701 | switch (expressionP->X_op) |
2ed83a59 | 702 | { |
5ac34ac3 ILT |
703 | case O_illegal: |
704 | case O_absent: | |
2ed83a59 | 705 | expressionP->X_add_number = 0; |
5ac34ac3 ILT |
706 | /* Fall through. */ |
707 | case O_big: | |
708 | case O_constant: | |
709 | case O_register: | |
2ed83a59 | 710 | expressionP->X_add_symbol = NULL; |
5ac34ac3 ILT |
711 | /* Fall through. */ |
712 | case O_symbol: | |
713 | case O_uminus: | |
714 | case O_bit_not: | |
715 | expressionP->X_op_symbol = NULL; | |
716 | break; | |
717 | case O_subtract: | |
718 | if (expressionP->X_op_symbol == expressionP->X_add_symbol | |
719 | || ((expressionP->X_op_symbol->sy_frag | |
720 | == expressionP->X_add_symbol->sy_frag) | |
ffffc8fb | 721 | && SEG_NORMAL (S_GET_SEGMENT (expressionP->X_add_symbol)) |
5ac34ac3 | 722 | && (S_GET_VALUE (expressionP->X_op_symbol) |
49864cfa | 723 | == S_GET_VALUE (expressionP->X_add_symbol)))) |
2ed83a59 | 724 | { |
5ac34ac3 | 725 | expressionP->X_op = O_constant; |
2ed83a59 | 726 | expressionP->X_add_symbol = NULL; |
5ac34ac3 | 727 | expressionP->X_op_symbol = NULL; |
fecd2382 | 728 | } |
5ac34ac3 ILT |
729 | break; |
730 | default: | |
731 | break; | |
fecd2382 | 732 | } |
f2f7d044 | 733 | } |
fecd2382 RP |
734 | \f |
735 | /* Expression parser. */ | |
736 | ||
737 | /* | |
738 | * We allow an empty expression, and just assume (absolute,0) silently. | |
739 | * Unary operators and parenthetical expressions are treated as operands. | |
740 | * As usual, Q==quantity==operand, O==operator, X==expression mnemonics. | |
741 | * | |
742 | * We used to do a aho/ullman shift-reduce parser, but the logic got so | |
743 | * warped that I flushed it and wrote a recursive-descent parser instead. | |
744 | * Now things are stable, would anybody like to write a fast parser? | |
745 | * Most expressions are either register (which does not even reach here) | |
746 | * or 1 symbol. Then "symbol+constant" and "symbol-symbol" are common. | |
747 | * So I guess it doesn't really matter how inefficient more complex expressions | |
748 | * are parsed. | |
749 | * | |
750 | * After expr(RANK,resultP) input_line_pointer->operator of rank <= RANK. | |
751 | * Also, we have consumed any leading or trailing spaces (operand does that) | |
752 | * and done all intervening operators. | |
5ac34ac3 ILT |
753 | * |
754 | * This returns the segment of the result, which will be | |
755 | * absolute_section or the segment of a symbol. | |
fecd2382 RP |
756 | */ |
757 | ||
49864cfa | 758 | #undef __ |
fecd2382 RP |
759 | #define __ O_illegal |
760 | ||
2ed83a59 KR |
761 | static const operatorT op_encoding[256] = |
762 | { /* maps ASCII->operators */ | |
763 | ||
764 | __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, | |
765 | __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, | |
766 | ||
767 | __, O_bit_or_not, __, __, __, O_modulus, O_bit_and, __, | |
768 | __, __, O_multiply, O_add, __, O_subtract, __, O_divide, | |
769 | __, __, __, __, __, __, __, __, | |
770 | __, __, __, __, O_left_shift, __, O_right_shift, __, | |
771 | __, __, __, __, __, __, __, __, | |
772 | __, __, __, __, __, __, __, __, | |
773 | __, __, __, __, __, __, __, __, | |
774 | __, __, __, __, __, __, O_bit_exclusive_or, __, | |
775 | __, __, __, __, __, __, __, __, | |
776 | __, __, __, __, __, __, __, __, | |
777 | __, __, __, __, __, __, __, __, | |
778 | __, __, __, __, O_bit_inclusive_or, __, __, __, | |
779 | ||
780 | __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, | |
781 | __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, | |
782 | __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, | |
783 | __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, | |
784 | __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, | |
785 | __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, | |
786 | __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, | |
787 | __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __ | |
788 | }; | |
fecd2382 RP |
789 | |
790 | ||
791 | /* | |
792 | * Rank Examples | |
793 | * 0 operand, (expression) | |
794 | * 1 + - | |
795 | * 2 & ^ ! | | |
796 | * 3 * / % << >> | |
5ac34ac3 | 797 | * 4 unary - unary ~ |
fecd2382 | 798 | */ |
5ac34ac3 ILT |
799 | static const operator_rankT op_rank[] = |
800 | { | |
801 | 0, /* O_illegal */ | |
802 | 0, /* O_absent */ | |
803 | 0, /* O_constant */ | |
804 | 0, /* O_symbol */ | |
805 | 0, /* O_register */ | |
806 | 0, /* O_bit */ | |
807 | 4, /* O_uminus */ | |
808 | 4, /* O_bit_now */ | |
809 | 3, /* O_multiply */ | |
810 | 3, /* O_divide */ | |
811 | 3, /* O_modulus */ | |
812 | 3, /* O_left_shift */ | |
813 | 3, /* O_right_shift */ | |
814 | 2, /* O_bit_inclusive_or */ | |
815 | 2, /* O_bit_or_not */ | |
816 | 2, /* O_bit_exclusive_or */ | |
817 | 2, /* O_bit_and */ | |
818 | 1, /* O_add */ | |
819 | 1, /* O_subtract */ | |
820 | }; | |
fecd2382 | 821 | \f |
5ac34ac3 | 822 | segT |
2ed83a59 | 823 | expr (rank, resultP) |
dae92eab KR |
824 | operator_rankT rank; /* Larger # is higher rank. */ |
825 | expressionS *resultP; /* Deliver result here. */ | |
fecd2382 | 826 | { |
5ac34ac3 | 827 | segT retval; |
2ed83a59 | 828 | expressionS right; |
dae92eab KR |
829 | operatorT op_left; |
830 | char c_left; /* 1st operator character. */ | |
831 | operatorT op_right; | |
832 | char c_right; | |
c593cf41 | 833 | |
2ed83a59 | 834 | know (rank >= 0); |
5ac34ac3 ILT |
835 | |
836 | retval = operand (resultP); | |
837 | ||
2ed83a59 | 838 | know (*input_line_pointer != ' '); /* Operand() gobbles spaces. */ |
5ac34ac3 | 839 | |
2ed83a59 | 840 | c_left = *input_line_pointer; /* Potential operator character. */ |
58d4951d | 841 | op_left = op_encoding[(unsigned char) c_left]; |
2ed83a59 | 842 | while (op_left != O_illegal && op_rank[(int) op_left] > rank) |
fecd2382 | 843 | { |
5ac34ac3 ILT |
844 | segT rightseg; |
845 | ||
2ed83a59 KR |
846 | input_line_pointer++; /*->after 1st character of operator. */ |
847 | /* Operators "<<" and ">>" have 2 characters. */ | |
848 | if (*input_line_pointer == c_left && (c_left == '<' || c_left == '>')) | |
5ac34ac3 ILT |
849 | ++input_line_pointer; |
850 | ||
851 | rightseg = expr (op_rank[(int) op_left], &right); | |
852 | if (right.X_op == O_absent) | |
fecd2382 | 853 | { |
5ac34ac3 ILT |
854 | as_warn ("missing operand; zero assumed"); |
855 | right.X_op = O_constant; | |
856 | right.X_add_number = 0; | |
d4c8cbd8 JL |
857 | right.X_add_symbol = NULL; |
858 | right.X_op_symbol = NULL; | |
fecd2382 | 859 | } |
5ac34ac3 | 860 | |
2ed83a59 | 861 | know (*input_line_pointer != ' '); |
5ac34ac3 | 862 | |
58d4951d ILT |
863 | if (retval == undefined_section) |
864 | { | |
865 | if (SEG_NORMAL (rightseg)) | |
866 | retval = rightseg; | |
867 | } | |
868 | else if (! SEG_NORMAL (retval)) | |
5ac34ac3 ILT |
869 | retval = rightseg; |
870 | else if (SEG_NORMAL (rightseg) | |
d4c8cbd8 JL |
871 | && retval != rightseg |
872 | #ifdef DIFF_EXPR_OK | |
873 | && op_left != O_subtract | |
874 | #endif | |
875 | ) | |
5ac34ac3 ILT |
876 | as_bad ("operation combines symbols in different segments"); |
877 | ||
2ed83a59 | 878 | c_right = *input_line_pointer; |
58d4951d | 879 | op_right = op_encoding[(unsigned char) c_right]; |
2ed83a59 | 880 | if (*input_line_pointer == c_right && (c_right == '<' || c_right == '>')) |
5ac34ac3 ILT |
881 | ++input_line_pointer; |
882 | ||
883 | know (op_right == O_illegal || op_rank[(int) op_right] <= op_rank[(int) op_left]); | |
884 | know ((int) op_left >= (int) O_multiply && (int) op_left <= (int) O_subtract); | |
885 | ||
c593cf41 SC |
886 | /* input_line_pointer->after right-hand quantity. */ |
887 | /* left-hand quantity in resultP */ | |
888 | /* right-hand quantity in right. */ | |
889 | /* operator in op_left. */ | |
5ac34ac3 ILT |
890 | |
891 | if (resultP->X_op == O_big) | |
fecd2382 | 892 | { |
5ac34ac3 ILT |
893 | as_warn ("left operand of %c is a %s; integer 0 assumed", |
894 | c_left, resultP->X_add_number > 0 ? "bignum" : "float"); | |
895 | resultP->X_op = O_constant; | |
896 | resultP->X_add_number = 0; | |
897 | resultP->X_add_symbol = NULL; | |
898 | resultP->X_op_symbol = NULL; | |
fecd2382 | 899 | } |
5ac34ac3 | 900 | if (right.X_op == O_big) |
fecd2382 | 901 | { |
5ac34ac3 ILT |
902 | as_warn ("right operand of %c is a %s; integer 0 assumed", |
903 | c_left, right.X_add_number > 0 ? "bignum" : "float"); | |
904 | right.X_op = O_constant; | |
905 | right.X_add_number = 0; | |
906 | right.X_add_symbol = NULL; | |
907 | right.X_op_symbol = NULL; | |
908 | } | |
909 | ||
910 | /* Optimize common cases. */ | |
911 | if (op_left == O_add && right.X_op == O_constant) | |
912 | { | |
913 | /* X + constant. */ | |
914 | resultP->X_add_number += right.X_add_number; | |
915 | } | |
916 | else if (op_left == O_subtract && right.X_op == O_constant) | |
917 | { | |
918 | /* X - constant. */ | |
919 | resultP->X_add_number -= right.X_add_number; | |
920 | } | |
921 | else if (op_left == O_add && resultP->X_op == O_constant) | |
922 | { | |
923 | /* Constant + X. */ | |
924 | resultP->X_op = right.X_op; | |
925 | resultP->X_add_symbol = right.X_add_symbol; | |
926 | resultP->X_op_symbol = right.X_op_symbol; | |
927 | resultP->X_add_number += right.X_add_number; | |
928 | retval = rightseg; | |
929 | } | |
930 | else if (resultP->X_op == O_constant && right.X_op == O_constant) | |
931 | { | |
932 | /* Constant OP constant. */ | |
933 | offsetT v = right.X_add_number; | |
934 | if (v == 0 && (op_left == O_divide || op_left == O_modulus)) | |
fecd2382 | 935 | { |
5ac34ac3 ILT |
936 | as_warn ("division by zero"); |
937 | v = 1; | |
fecd2382 | 938 | } |
5ac34ac3 | 939 | switch (op_left) |
fecd2382 | 940 | { |
5ac34ac3 ILT |
941 | case O_multiply: resultP->X_add_number *= v; break; |
942 | case O_divide: resultP->X_add_number /= v; break; | |
943 | case O_modulus: resultP->X_add_number %= v; break; | |
944 | case O_left_shift: resultP->X_add_number <<= v; break; | |
945 | case O_right_shift: resultP->X_add_number >>= v; break; | |
946 | case O_bit_inclusive_or: resultP->X_add_number |= v; break; | |
947 | case O_bit_or_not: resultP->X_add_number |= ~v; break; | |
948 | case O_bit_exclusive_or: resultP->X_add_number ^= v; break; | |
949 | case O_bit_and: resultP->X_add_number &= v; break; | |
950 | case O_add: resultP->X_add_number += v; break; | |
951 | case O_subtract: resultP->X_add_number -= v; break; | |
952 | default: abort (); | |
fecd2382 | 953 | } |
5ac34ac3 ILT |
954 | } |
955 | else if (resultP->X_op == O_symbol | |
956 | && right.X_op == O_symbol | |
957 | && (op_left == O_add | |
958 | || op_left == O_subtract | |
959 | || (resultP->X_add_number == 0 | |
960 | && right.X_add_number == 0))) | |
961 | { | |
962 | /* Symbol OP symbol. */ | |
963 | resultP->X_op = op_left; | |
964 | resultP->X_op_symbol = right.X_add_symbol; | |
c593cf41 | 965 | if (op_left == O_add) |
5ac34ac3 ILT |
966 | resultP->X_add_number += right.X_add_number; |
967 | else if (op_left == O_subtract) | |
968 | resultP->X_add_number -= right.X_add_number; | |
969 | } | |
970 | else | |
971 | { | |
972 | /* The general case. */ | |
973 | resultP->X_add_symbol = make_expr_symbol (resultP); | |
974 | resultP->X_op_symbol = make_expr_symbol (&right); | |
975 | resultP->X_op = op_left; | |
976 | resultP->X_add_number = 0; | |
d4c8cbd8 | 977 | resultP->X_unsigned = 1; |
5ac34ac3 | 978 | } |
351878df | 979 | |
2ed83a59 | 980 | op_left = op_right; |
fecd2382 | 981 | } /* While next operator is >= this rank. */ |
5ac34ac3 | 982 | |
009dc5e1 JL |
983 | /* The PA port needs this information. */ |
984 | if (resultP->X_add_symbol) | |
985 | resultP->X_add_symbol->sy_used = 1; | |
986 | ||
5ac34ac3 | 987 | return resultP->X_op == O_constant ? absolute_section : retval; |
fecd2382 RP |
988 | } |
989 | \f | |
990 | /* | |
991 | * get_symbol_end() | |
992 | * | |
993 | * This lives here because it belongs equally in expr.c & read.c. | |
994 | * Expr.c is just a branch office read.c anyway, and putting it | |
995 | * here lessens the crowd at read.c. | |
996 | * | |
997 | * Assume input_line_pointer is at start of symbol name. | |
998 | * Advance input_line_pointer past symbol name. | |
999 | * Turn that character into a '\0', returning its former value. | |
1000 | * This allows a string compare (RMS wants symbol names to be strings) | |
1001 | * of the symbol name. | |
1002 | * There will always be a char following symbol name, because all good | |
1003 | * lines end in end-of-line. | |
1004 | */ | |
1005 | char | |
2ed83a59 | 1006 | get_symbol_end () |
fecd2382 | 1007 | { |
dae92eab | 1008 | char c; |
2ed83a59 KR |
1009 | |
1010 | while (is_part_of_name (c = *input_line_pointer++)) | |
1011 | ; | |
1012 | *--input_line_pointer = 0; | |
1013 | return (c); | |
fecd2382 RP |
1014 | } |
1015 | ||
a39116f1 | 1016 | |
351878df | 1017 | unsigned int |
2ed83a59 | 1018 | get_single_number () |
a39116f1 | 1019 | { |
2ed83a59 KR |
1020 | expressionS exp; |
1021 | operand (&exp); | |
1022 | return exp.X_add_number; | |
1023 | ||
a39116f1 | 1024 | } |
2ed83a59 | 1025 | |
8b228fe9 | 1026 | /* end of expr.c */ |