PR rtl-optimization/20370
[official-gcc.git] / gcc / stmt.c
blobe38b96b6c293eb8d86a1cb9347534389056f9c8e
1 /* Expands front end tree to back end RTL for GCC
2 Copyright (C) 1987, 1988, 1989, 1992, 1993, 1994, 1995, 1996, 1997,
3 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005
4 Free Software Foundation, Inc.
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify it under
9 the terms of the GNU General Public License as published by the Free
10 Software Foundation; either version 2, or (at your option) any later
11 version.
13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING. If not, write to the Free
20 Software Foundation, 51 Franklin Street, Fifth Floor, Boston, MA
21 02110-1301, USA. */
23 /* This file handles the generation of rtl code from tree structure
24 above the level of expressions, using subroutines in exp*.c and emit-rtl.c.
25 The functions whose names start with `expand_' are called by the
26 expander to generate RTL instructions for various kinds of constructs. */
28 #include "config.h"
29 #include "system.h"
30 #include "coretypes.h"
31 #include "tm.h"
33 #include "rtl.h"
34 #include "hard-reg-set.h"
35 #include "tree.h"
36 #include "tm_p.h"
37 #include "flags.h"
38 #include "except.h"
39 #include "function.h"
40 #include "insn-config.h"
41 #include "expr.h"
42 #include "libfuncs.h"
43 #include "recog.h"
44 #include "machmode.h"
45 #include "toplev.h"
46 #include "output.h"
47 #include "ggc.h"
48 #include "langhooks.h"
49 #include "predict.h"
50 #include "optabs.h"
51 #include "target.h"
52 #include "regs.h"
54 /* Functions and data structures for expanding case statements. */
56 /* Case label structure, used to hold info on labels within case
57 statements. We handle "range" labels; for a single-value label
58 as in C, the high and low limits are the same.
60 We start with a vector of case nodes sorted in ascending order, and
61 the default label as the last element in the vector. Before expanding
62 to RTL, we transform this vector into a list linked via the RIGHT
63 fields in the case_node struct. Nodes with higher case values are
64 later in the list.
66 Switch statements can be output in three forms. A branch table is
67 used if there are more than a few labels and the labels are dense
68 within the range between the smallest and largest case value. If a
69 branch table is used, no further manipulations are done with the case
70 node chain.
72 The alternative to the use of a branch table is to generate a series
73 of compare and jump insns. When that is done, we use the LEFT, RIGHT,
74 and PARENT fields to hold a binary tree. Initially the tree is
75 totally unbalanced, with everything on the right. We balance the tree
76 with nodes on the left having lower case values than the parent
77 and nodes on the right having higher values. We then output the tree
78 in order.
80 For very small, suitable switch statements, we can generate a series
81 of simple bit test and branches instead. */
83 struct case_node GTY(())
85 struct case_node *left; /* Left son in binary tree */
86 struct case_node *right; /* Right son in binary tree; also node chain */
87 struct case_node *parent; /* Parent of node in binary tree */
88 tree low; /* Lowest index value for this label */
89 tree high; /* Highest index value for this label */
90 tree code_label; /* Label to jump to when node matches */
93 typedef struct case_node case_node;
94 typedef struct case_node *case_node_ptr;
96 /* These are used by estimate_case_costs and balance_case_nodes. */
98 /* This must be a signed type, and non-ANSI compilers lack signed char. */
99 static short cost_table_[129];
100 static int use_cost_table;
101 static int cost_table_initialized;
103 /* Special care is needed because we allow -1, but TREE_INT_CST_LOW
104 is unsigned. */
105 #define COST_TABLE(I) cost_table_[(unsigned HOST_WIDE_INT) ((I) + 1)]
107 static int n_occurrences (int, const char *);
108 static bool decl_conflicts_with_clobbers_p (tree, const HARD_REG_SET);
109 static void expand_nl_goto_receiver (void);
110 static bool check_operand_nalternatives (tree, tree);
111 static bool check_unique_operand_names (tree, tree);
112 static char *resolve_operand_name_1 (char *, tree, tree);
113 static void expand_null_return_1 (void);
114 static void expand_value_return (rtx);
115 static void do_jump_if_equal (rtx, rtx, rtx, int);
116 static int estimate_case_costs (case_node_ptr);
117 static bool lshift_cheap_p (void);
118 static int case_bit_test_cmp (const void *, const void *);
119 static void emit_case_bit_tests (tree, tree, tree, tree, case_node_ptr, rtx);
120 static void balance_case_nodes (case_node_ptr *, case_node_ptr);
121 static int node_has_low_bound (case_node_ptr, tree);
122 static int node_has_high_bound (case_node_ptr, tree);
123 static int node_is_bounded (case_node_ptr, tree);
124 static void emit_case_nodes (rtx, case_node_ptr, rtx, tree);
125 static struct case_node *add_case_node (struct case_node *, tree,
126 tree, tree, tree);
129 /* Return the rtx-label that corresponds to a LABEL_DECL,
130 creating it if necessary. */
133 label_rtx (tree label)
135 gcc_assert (TREE_CODE (label) == LABEL_DECL);
137 if (!DECL_RTL_SET_P (label))
139 rtx r = gen_label_rtx ();
140 SET_DECL_RTL (label, r);
141 if (FORCED_LABEL (label) || DECL_NONLOCAL (label))
142 LABEL_PRESERVE_P (r) = 1;
145 return DECL_RTL (label);
148 /* As above, but also put it on the forced-reference list of the
149 function that contains it. */
151 force_label_rtx (tree label)
153 rtx ref = label_rtx (label);
154 tree function = decl_function_context (label);
155 struct function *p;
157 gcc_assert (function);
159 if (function != current_function_decl)
160 p = find_function_data (function);
161 else
162 p = cfun;
164 p->expr->x_forced_labels = gen_rtx_EXPR_LIST (VOIDmode, ref,
165 p->expr->x_forced_labels);
166 return ref;
169 /* Add an unconditional jump to LABEL as the next sequential instruction. */
171 void
172 emit_jump (rtx label)
174 do_pending_stack_adjust ();
175 emit_jump_insn (gen_jump (label));
176 emit_barrier ();
179 /* Emit code to jump to the address
180 specified by the pointer expression EXP. */
182 void
183 expand_computed_goto (tree exp)
185 rtx x = expand_expr (exp, NULL_RTX, VOIDmode, 0);
187 x = convert_memory_address (Pmode, x);
189 do_pending_stack_adjust ();
190 emit_indirect_jump (x);
193 /* Handle goto statements and the labels that they can go to. */
195 /* Specify the location in the RTL code of a label LABEL,
196 which is a LABEL_DECL tree node.
198 This is used for the kind of label that the user can jump to with a
199 goto statement, and for alternatives of a switch or case statement.
200 RTL labels generated for loops and conditionals don't go through here;
201 they are generated directly at the RTL level, by other functions below.
203 Note that this has nothing to do with defining label *names*.
204 Languages vary in how they do that and what that even means. */
206 void
207 expand_label (tree label)
209 rtx label_r = label_rtx (label);
211 do_pending_stack_adjust ();
212 emit_label (label_r);
213 if (DECL_NAME (label))
214 LABEL_NAME (DECL_RTL (label)) = IDENTIFIER_POINTER (DECL_NAME (label));
216 if (DECL_NONLOCAL (label))
218 expand_nl_goto_receiver ();
219 nonlocal_goto_handler_labels
220 = gen_rtx_EXPR_LIST (VOIDmode, label_r,
221 nonlocal_goto_handler_labels);
224 if (FORCED_LABEL (label))
225 forced_labels = gen_rtx_EXPR_LIST (VOIDmode, label_r, forced_labels);
227 if (DECL_NONLOCAL (label) || FORCED_LABEL (label))
228 maybe_set_first_label_num (label_r);
231 /* Generate RTL code for a `goto' statement with target label LABEL.
232 LABEL should be a LABEL_DECL tree node that was or will later be
233 defined with `expand_label'. */
235 void
236 expand_goto (tree label)
238 #ifdef ENABLE_CHECKING
239 /* Check for a nonlocal goto to a containing function. Should have
240 gotten translated to __builtin_nonlocal_goto. */
241 tree context = decl_function_context (label);
242 gcc_assert (!context || context == current_function_decl);
243 #endif
245 emit_jump (label_rtx (label));
248 /* Return the number of times character C occurs in string S. */
249 static int
250 n_occurrences (int c, const char *s)
252 int n = 0;
253 while (*s)
254 n += (*s++ == c);
255 return n;
258 /* Generate RTL for an asm statement (explicit assembler code).
259 STRING is a STRING_CST node containing the assembler code text,
260 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
261 insn is volatile; don't optimize it. */
263 static void
264 expand_asm (tree string, int vol)
266 rtx body;
268 if (TREE_CODE (string) == ADDR_EXPR)
269 string = TREE_OPERAND (string, 0);
271 body = gen_rtx_ASM_INPUT (VOIDmode,
272 ggc_strdup (TREE_STRING_POINTER (string)));
274 MEM_VOLATILE_P (body) = vol;
276 emit_insn (body);
279 /* Parse the output constraint pointed to by *CONSTRAINT_P. It is the
280 OPERAND_NUMth output operand, indexed from zero. There are NINPUTS
281 inputs and NOUTPUTS outputs to this extended-asm. Upon return,
282 *ALLOWS_MEM will be TRUE iff the constraint allows the use of a
283 memory operand. Similarly, *ALLOWS_REG will be TRUE iff the
284 constraint allows the use of a register operand. And, *IS_INOUT
285 will be true if the operand is read-write, i.e., if it is used as
286 an input as well as an output. If *CONSTRAINT_P is not in
287 canonical form, it will be made canonical. (Note that `+' will be
288 replaced with `=' as part of this process.)
290 Returns TRUE if all went well; FALSE if an error occurred. */
292 bool
293 parse_output_constraint (const char **constraint_p, int operand_num,
294 int ninputs, int noutputs, bool *allows_mem,
295 bool *allows_reg, bool *is_inout)
297 const char *constraint = *constraint_p;
298 const char *p;
300 /* Assume the constraint doesn't allow the use of either a register
301 or memory. */
302 *allows_mem = false;
303 *allows_reg = false;
305 /* Allow the `=' or `+' to not be at the beginning of the string,
306 since it wasn't explicitly documented that way, and there is a
307 large body of code that puts it last. Swap the character to
308 the front, so as not to uglify any place else. */
309 p = strchr (constraint, '=');
310 if (!p)
311 p = strchr (constraint, '+');
313 /* If the string doesn't contain an `=', issue an error
314 message. */
315 if (!p)
317 error ("output operand constraint lacks %<=%>");
318 return false;
321 /* If the constraint begins with `+', then the operand is both read
322 from and written to. */
323 *is_inout = (*p == '+');
325 /* Canonicalize the output constraint so that it begins with `='. */
326 if (p != constraint || *is_inout)
328 char *buf;
329 size_t c_len = strlen (constraint);
331 if (p != constraint)
332 warning (0, "output constraint %qc for operand %d "
333 "is not at the beginning",
334 *p, operand_num);
336 /* Make a copy of the constraint. */
337 buf = alloca (c_len + 1);
338 strcpy (buf, constraint);
339 /* Swap the first character and the `=' or `+'. */
340 buf[p - constraint] = buf[0];
341 /* Make sure the first character is an `='. (Until we do this,
342 it might be a `+'.) */
343 buf[0] = '=';
344 /* Replace the constraint with the canonicalized string. */
345 *constraint_p = ggc_alloc_string (buf, c_len);
346 constraint = *constraint_p;
349 /* Loop through the constraint string. */
350 for (p = constraint + 1; *p; p += CONSTRAINT_LEN (*p, p))
351 switch (*p)
353 case '+':
354 case '=':
355 error ("operand constraint contains incorrectly positioned "
356 "%<+%> or %<=%>");
357 return false;
359 case '%':
360 if (operand_num + 1 == ninputs + noutputs)
362 error ("%<%%%> constraint used with last operand");
363 return false;
365 break;
367 case 'V': case 'm': case 'o':
368 *allows_mem = true;
369 break;
371 case '?': case '!': case '*': case '&': case '#':
372 case 'E': case 'F': case 'G': case 'H':
373 case 's': case 'i': case 'n':
374 case 'I': case 'J': case 'K': case 'L': case 'M':
375 case 'N': case 'O': case 'P': case ',':
376 break;
378 case '0': case '1': case '2': case '3': case '4':
379 case '5': case '6': case '7': case '8': case '9':
380 case '[':
381 error ("matching constraint not valid in output operand");
382 return false;
384 case '<': case '>':
385 /* ??? Before flow, auto inc/dec insns are not supposed to exist,
386 excepting those that expand_call created. So match memory
387 and hope. */
388 *allows_mem = true;
389 break;
391 case 'g': case 'X':
392 *allows_reg = true;
393 *allows_mem = true;
394 break;
396 case 'p': case 'r':
397 *allows_reg = true;
398 break;
400 default:
401 if (!ISALPHA (*p))
402 break;
403 if (REG_CLASS_FROM_CONSTRAINT (*p, p) != NO_REGS)
404 *allows_reg = true;
405 #ifdef EXTRA_CONSTRAINT_STR
406 else if (EXTRA_ADDRESS_CONSTRAINT (*p, p))
407 *allows_reg = true;
408 else if (EXTRA_MEMORY_CONSTRAINT (*p, p))
409 *allows_mem = true;
410 else
412 /* Otherwise we can't assume anything about the nature of
413 the constraint except that it isn't purely registers.
414 Treat it like "g" and hope for the best. */
415 *allows_reg = true;
416 *allows_mem = true;
418 #endif
419 break;
422 return true;
425 /* Similar, but for input constraints. */
427 bool
428 parse_input_constraint (const char **constraint_p, int input_num,
429 int ninputs, int noutputs, int ninout,
430 const char * const * constraints,
431 bool *allows_mem, bool *allows_reg)
433 const char *constraint = *constraint_p;
434 const char *orig_constraint = constraint;
435 size_t c_len = strlen (constraint);
436 size_t j;
437 bool saw_match = false;
439 /* Assume the constraint doesn't allow the use of either
440 a register or memory. */
441 *allows_mem = false;
442 *allows_reg = false;
444 /* Make sure constraint has neither `=', `+', nor '&'. */
446 for (j = 0; j < c_len; j += CONSTRAINT_LEN (constraint[j], constraint+j))
447 switch (constraint[j])
449 case '+': case '=': case '&':
450 if (constraint == orig_constraint)
452 error ("input operand constraint contains %qc", constraint[j]);
453 return false;
455 break;
457 case '%':
458 if (constraint == orig_constraint
459 && input_num + 1 == ninputs - ninout)
461 error ("%<%%%> constraint used with last operand");
462 return false;
464 break;
466 case 'V': case 'm': case 'o':
467 *allows_mem = true;
468 break;
470 case '<': case '>':
471 case '?': case '!': case '*': case '#':
472 case 'E': case 'F': case 'G': case 'H':
473 case 's': case 'i': case 'n':
474 case 'I': case 'J': case 'K': case 'L': case 'M':
475 case 'N': case 'O': case 'P': case ',':
476 break;
478 /* Whether or not a numeric constraint allows a register is
479 decided by the matching constraint, and so there is no need
480 to do anything special with them. We must handle them in
481 the default case, so that we don't unnecessarily force
482 operands to memory. */
483 case '0': case '1': case '2': case '3': case '4':
484 case '5': case '6': case '7': case '8': case '9':
486 char *end;
487 unsigned long match;
489 saw_match = true;
491 match = strtoul (constraint + j, &end, 10);
492 if (match >= (unsigned long) noutputs)
494 error ("matching constraint references invalid operand number");
495 return false;
498 /* Try and find the real constraint for this dup. Only do this
499 if the matching constraint is the only alternative. */
500 if (*end == '\0'
501 && (j == 0 || (j == 1 && constraint[0] == '%')))
503 constraint = constraints[match];
504 *constraint_p = constraint;
505 c_len = strlen (constraint);
506 j = 0;
507 /* ??? At the end of the loop, we will skip the first part of
508 the matched constraint. This assumes not only that the
509 other constraint is an output constraint, but also that
510 the '=' or '+' come first. */
511 break;
513 else
514 j = end - constraint;
515 /* Anticipate increment at end of loop. */
516 j--;
518 /* Fall through. */
520 case 'p': case 'r':
521 *allows_reg = true;
522 break;
524 case 'g': case 'X':
525 *allows_reg = true;
526 *allows_mem = true;
527 break;
529 default:
530 if (! ISALPHA (constraint[j]))
532 error ("invalid punctuation %qc in constraint", constraint[j]);
533 return false;
535 if (REG_CLASS_FROM_CONSTRAINT (constraint[j], constraint + j)
536 != NO_REGS)
537 *allows_reg = true;
538 #ifdef EXTRA_CONSTRAINT_STR
539 else if (EXTRA_ADDRESS_CONSTRAINT (constraint[j], constraint + j))
540 *allows_reg = true;
541 else if (EXTRA_MEMORY_CONSTRAINT (constraint[j], constraint + j))
542 *allows_mem = true;
543 else
545 /* Otherwise we can't assume anything about the nature of
546 the constraint except that it isn't purely registers.
547 Treat it like "g" and hope for the best. */
548 *allows_reg = true;
549 *allows_mem = true;
551 #endif
552 break;
555 if (saw_match && !*allows_reg)
556 warning (0, "matching constraint does not allow a register");
558 return true;
561 /* Return true iff there's an overlap between REGS and DECL, where DECL
562 can be an asm-declared register. */
564 bool
565 decl_overlaps_hard_reg_set_p (tree decl, const HARD_REG_SET regs)
567 if ((TREE_CODE (decl) == VAR_DECL || TREE_CODE (decl) == PARM_DECL)
568 && DECL_REGISTER (decl)
569 && REG_P (DECL_RTL (decl))
570 && REGNO (DECL_RTL (decl)) < FIRST_PSEUDO_REGISTER)
572 rtx reg = DECL_RTL (decl);
573 unsigned int regno;
575 for (regno = REGNO (reg);
576 regno < (REGNO (reg)
577 + hard_regno_nregs[REGNO (reg)][GET_MODE (reg)]);
578 regno++)
579 if (TEST_HARD_REG_BIT (regs, regno))
580 return true;
583 return false;
587 /* Check for overlap between registers marked in CLOBBERED_REGS and
588 anything inappropriate in DECL. Emit error and return TRUE for error,
589 FALSE for ok. */
591 static bool
592 decl_conflicts_with_clobbers_p (tree decl, const HARD_REG_SET clobbered_regs)
594 /* Conflicts between asm-declared register variables and the clobber
595 list are not allowed. */
596 if (decl_overlaps_hard_reg_set_p (decl, clobbered_regs))
598 error ("asm-specifier for variable %qs conflicts with asm clobber list",
599 IDENTIFIER_POINTER (DECL_NAME (decl)));
601 /* Reset registerness to stop multiple errors emitted for a single
602 variable. */
603 DECL_REGISTER (decl) = 0;
604 return true;
607 return false;
610 /* Generate RTL for an asm statement with arguments.
611 STRING is the instruction template.
612 OUTPUTS is a list of output arguments (lvalues); INPUTS a list of inputs.
613 Each output or input has an expression in the TREE_VALUE and
614 and a tree list in TREE_PURPOSE which in turn contains a constraint
615 name in TREE_VALUE (or NULL_TREE) and a constraint string
616 in TREE_PURPOSE.
617 CLOBBERS is a list of STRING_CST nodes each naming a hard register
618 that is clobbered by this insn.
620 Not all kinds of lvalue that may appear in OUTPUTS can be stored directly.
621 Some elements of OUTPUTS may be replaced with trees representing temporary
622 values. The caller should copy those temporary values to the originally
623 specified lvalues.
625 VOL nonzero means the insn is volatile; don't optimize it. */
627 static void
628 expand_asm_operands (tree string, tree outputs, tree inputs,
629 tree clobbers, int vol, location_t locus)
631 rtvec argvec, constraintvec;
632 rtx body;
633 int ninputs = list_length (inputs);
634 int noutputs = list_length (outputs);
635 int ninout;
636 int nclobbers;
637 HARD_REG_SET clobbered_regs;
638 int clobber_conflict_found = 0;
639 tree tail;
640 tree t;
641 int i;
642 /* Vector of RTX's of evaluated output operands. */
643 rtx *output_rtx = alloca (noutputs * sizeof (rtx));
644 int *inout_opnum = alloca (noutputs * sizeof (int));
645 rtx *real_output_rtx = alloca (noutputs * sizeof (rtx));
646 enum machine_mode *inout_mode
647 = alloca (noutputs * sizeof (enum machine_mode));
648 const char **constraints
649 = alloca ((noutputs + ninputs) * sizeof (const char *));
650 int old_generating_concat_p = generating_concat_p;
652 /* An ASM with no outputs needs to be treated as volatile, for now. */
653 if (noutputs == 0)
654 vol = 1;
656 if (! check_operand_nalternatives (outputs, inputs))
657 return;
659 string = resolve_asm_operand_names (string, outputs, inputs);
661 /* Collect constraints. */
662 i = 0;
663 for (t = outputs; t ; t = TREE_CHAIN (t), i++)
664 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
665 for (t = inputs; t ; t = TREE_CHAIN (t), i++)
666 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
668 /* Sometimes we wish to automatically clobber registers across an asm.
669 Case in point is when the i386 backend moved from cc0 to a hard reg --
670 maintaining source-level compatibility means automatically clobbering
671 the flags register. */
672 clobbers = targetm.md_asm_clobbers (outputs, inputs, clobbers);
674 /* Count the number of meaningful clobbered registers, ignoring what
675 we would ignore later. */
676 nclobbers = 0;
677 CLEAR_HARD_REG_SET (clobbered_regs);
678 for (tail = clobbers; tail; tail = TREE_CHAIN (tail))
680 const char *regname = TREE_STRING_POINTER (TREE_VALUE (tail));
682 i = decode_reg_name (regname);
683 if (i >= 0 || i == -4)
684 ++nclobbers;
685 else if (i == -2)
686 error ("unknown register name %qs in %<asm%>", regname);
688 /* Mark clobbered registers. */
689 if (i >= 0)
691 /* Clobbering the PIC register is an error. */
692 if (i == (int) PIC_OFFSET_TABLE_REGNUM)
694 error ("PIC register %qs clobbered in %<asm%>", regname);
695 return;
698 SET_HARD_REG_BIT (clobbered_regs, i);
702 /* First pass over inputs and outputs checks validity and sets
703 mark_addressable if needed. */
705 ninout = 0;
706 for (i = 0, tail = outputs; tail; tail = TREE_CHAIN (tail), i++)
708 tree val = TREE_VALUE (tail);
709 tree type = TREE_TYPE (val);
710 const char *constraint;
711 bool is_inout;
712 bool allows_reg;
713 bool allows_mem;
715 /* If there's an erroneous arg, emit no insn. */
716 if (type == error_mark_node)
717 return;
719 /* Try to parse the output constraint. If that fails, there's
720 no point in going further. */
721 constraint = constraints[i];
722 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
723 &allows_mem, &allows_reg, &is_inout))
724 return;
726 if (! allows_reg
727 && (allows_mem
728 || is_inout
729 || (DECL_P (val)
730 && REG_P (DECL_RTL (val))
731 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
732 lang_hooks.mark_addressable (val);
734 if (is_inout)
735 ninout++;
738 ninputs += ninout;
739 if (ninputs + noutputs > MAX_RECOG_OPERANDS)
741 error ("more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
742 return;
745 for (i = 0, tail = inputs; tail; i++, tail = TREE_CHAIN (tail))
747 bool allows_reg, allows_mem;
748 const char *constraint;
750 /* If there's an erroneous arg, emit no insn, because the ASM_INPUT
751 would get VOIDmode and that could cause a crash in reload. */
752 if (TREE_TYPE (TREE_VALUE (tail)) == error_mark_node)
753 return;
755 constraint = constraints[i + noutputs];
756 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, ninout,
757 constraints, &allows_mem, &allows_reg))
758 return;
760 if (! allows_reg && allows_mem)
761 lang_hooks.mark_addressable (TREE_VALUE (tail));
764 /* Second pass evaluates arguments. */
766 ninout = 0;
767 for (i = 0, tail = outputs; tail; tail = TREE_CHAIN (tail), i++)
769 tree val = TREE_VALUE (tail);
770 tree type = TREE_TYPE (val);
771 bool is_inout;
772 bool allows_reg;
773 bool allows_mem;
774 rtx op;
775 bool ok;
777 ok = parse_output_constraint (&constraints[i], i, ninputs,
778 noutputs, &allows_mem, &allows_reg,
779 &is_inout);
780 gcc_assert (ok);
782 /* If an output operand is not a decl or indirect ref and our constraint
783 allows a register, make a temporary to act as an intermediate.
784 Make the asm insn write into that, then our caller will copy it to
785 the real output operand. Likewise for promoted variables. */
787 generating_concat_p = 0;
789 real_output_rtx[i] = NULL_RTX;
790 if ((TREE_CODE (val) == INDIRECT_REF
791 && allows_mem)
792 || (DECL_P (val)
793 && (allows_mem || REG_P (DECL_RTL (val)))
794 && ! (REG_P (DECL_RTL (val))
795 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
796 || ! allows_reg
797 || is_inout)
799 op = expand_expr (val, NULL_RTX, VOIDmode, EXPAND_WRITE);
800 if (MEM_P (op))
801 op = validize_mem (op);
803 if (! allows_reg && !MEM_P (op))
804 error ("output number %d not directly addressable", i);
805 if ((! allows_mem && MEM_P (op))
806 || GET_CODE (op) == CONCAT)
808 real_output_rtx[i] = op;
809 op = gen_reg_rtx (GET_MODE (op));
810 if (is_inout)
811 emit_move_insn (op, real_output_rtx[i]);
814 else
816 op = assign_temp (type, 0, 0, 1);
817 op = validize_mem (op);
818 TREE_VALUE (tail) = make_tree (type, op);
820 output_rtx[i] = op;
822 generating_concat_p = old_generating_concat_p;
824 if (is_inout)
826 inout_mode[ninout] = TYPE_MODE (type);
827 inout_opnum[ninout++] = i;
830 if (decl_conflicts_with_clobbers_p (val, clobbered_regs))
831 clobber_conflict_found = 1;
834 /* Make vectors for the expression-rtx, constraint strings,
835 and named operands. */
837 argvec = rtvec_alloc (ninputs);
838 constraintvec = rtvec_alloc (ninputs);
840 body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
841 : GET_MODE (output_rtx[0])),
842 ggc_strdup (TREE_STRING_POINTER (string)),
843 empty_string, 0, argvec, constraintvec,
844 locus);
846 MEM_VOLATILE_P (body) = vol;
848 /* Eval the inputs and put them into ARGVEC.
849 Put their constraints into ASM_INPUTs and store in CONSTRAINTS. */
851 for (i = 0, tail = inputs; tail; tail = TREE_CHAIN (tail), ++i)
853 bool allows_reg, allows_mem;
854 const char *constraint;
855 tree val, type;
856 rtx op;
857 bool ok;
859 constraint = constraints[i + noutputs];
860 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, ninout,
861 constraints, &allows_mem, &allows_reg);
862 gcc_assert (ok);
864 generating_concat_p = 0;
866 val = TREE_VALUE (tail);
867 type = TREE_TYPE (val);
868 op = expand_expr (val, NULL_RTX, VOIDmode,
869 (allows_mem && !allows_reg
870 ? EXPAND_MEMORY : EXPAND_NORMAL));
872 /* Never pass a CONCAT to an ASM. */
873 if (GET_CODE (op) == CONCAT)
874 op = force_reg (GET_MODE (op), op);
875 else if (MEM_P (op))
876 op = validize_mem (op);
878 if (asm_operand_ok (op, constraint) <= 0)
880 if (allows_reg && TYPE_MODE (type) != BLKmode)
881 op = force_reg (TYPE_MODE (type), op);
882 else if (!allows_mem)
883 warning (0, "asm operand %d probably doesn%'t match constraints",
884 i + noutputs);
885 else if (MEM_P (op))
887 /* We won't recognize either volatile memory or memory
888 with a queued address as available a memory_operand
889 at this point. Ignore it: clearly this *is* a memory. */
891 else
893 warning (0, "use of memory input without lvalue in "
894 "asm operand %d is deprecated", i + noutputs);
896 if (CONSTANT_P (op))
898 rtx mem = force_const_mem (TYPE_MODE (type), op);
899 if (mem)
900 op = validize_mem (mem);
901 else
902 op = force_reg (TYPE_MODE (type), op);
904 if (REG_P (op)
905 || GET_CODE (op) == SUBREG
906 || GET_CODE (op) == CONCAT)
908 tree qual_type = build_qualified_type (type,
909 (TYPE_QUALS (type)
910 | TYPE_QUAL_CONST));
911 rtx memloc = assign_temp (qual_type, 1, 1, 1);
912 memloc = validize_mem (memloc);
913 emit_move_insn (memloc, op);
914 op = memloc;
919 generating_concat_p = old_generating_concat_p;
920 ASM_OPERANDS_INPUT (body, i) = op;
922 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
923 = gen_rtx_ASM_INPUT (TYPE_MODE (type),
924 ggc_strdup (constraints[i + noutputs]));
926 if (decl_conflicts_with_clobbers_p (val, clobbered_regs))
927 clobber_conflict_found = 1;
930 /* Protect all the operands from the queue now that they have all been
931 evaluated. */
933 generating_concat_p = 0;
935 /* For in-out operands, copy output rtx to input rtx. */
936 for (i = 0; i < ninout; i++)
938 int j = inout_opnum[i];
939 char buffer[16];
941 ASM_OPERANDS_INPUT (body, ninputs - ninout + i)
942 = output_rtx[j];
944 sprintf (buffer, "%d", j);
945 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, ninputs - ninout + i)
946 = gen_rtx_ASM_INPUT (inout_mode[i], ggc_strdup (buffer));
949 generating_concat_p = old_generating_concat_p;
951 /* Now, for each output, construct an rtx
952 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
953 ARGVEC CONSTRAINTS OPNAMES))
954 If there is more than one, put them inside a PARALLEL. */
956 if (noutputs == 1 && nclobbers == 0)
958 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = ggc_strdup (constraints[0]);
959 emit_insn (gen_rtx_SET (VOIDmode, output_rtx[0], body));
962 else if (noutputs == 0 && nclobbers == 0)
964 /* No output operands: put in a raw ASM_OPERANDS rtx. */
965 emit_insn (body);
968 else
970 rtx obody = body;
971 int num = noutputs;
973 if (num == 0)
974 num = 1;
976 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (num + nclobbers));
978 /* For each output operand, store a SET. */
979 for (i = 0, tail = outputs; tail; tail = TREE_CHAIN (tail), i++)
981 XVECEXP (body, 0, i)
982 = gen_rtx_SET (VOIDmode,
983 output_rtx[i],
984 gen_rtx_ASM_OPERANDS
985 (GET_MODE (output_rtx[i]),
986 ggc_strdup (TREE_STRING_POINTER (string)),
987 ggc_strdup (constraints[i]),
988 i, argvec, constraintvec, locus));
990 MEM_VOLATILE_P (SET_SRC (XVECEXP (body, 0, i))) = vol;
993 /* If there are no outputs (but there are some clobbers)
994 store the bare ASM_OPERANDS into the PARALLEL. */
996 if (i == 0)
997 XVECEXP (body, 0, i++) = obody;
999 /* Store (clobber REG) for each clobbered register specified. */
1001 for (tail = clobbers; tail; tail = TREE_CHAIN (tail))
1003 const char *regname = TREE_STRING_POINTER (TREE_VALUE (tail));
1004 int j = decode_reg_name (regname);
1005 rtx clobbered_reg;
1007 if (j < 0)
1009 if (j == -3) /* `cc', which is not a register */
1010 continue;
1012 if (j == -4) /* `memory', don't cache memory across asm */
1014 XVECEXP (body, 0, i++)
1015 = gen_rtx_CLOBBER (VOIDmode,
1016 gen_rtx_MEM
1017 (BLKmode,
1018 gen_rtx_SCRATCH (VOIDmode)));
1019 continue;
1022 /* Ignore unknown register, error already signaled. */
1023 continue;
1026 /* Use QImode since that's guaranteed to clobber just one reg. */
1027 clobbered_reg = gen_rtx_REG (QImode, j);
1029 /* Do sanity check for overlap between clobbers and respectively
1030 input and outputs that hasn't been handled. Such overlap
1031 should have been detected and reported above. */
1032 if (!clobber_conflict_found)
1034 int opno;
1036 /* We test the old body (obody) contents to avoid tripping
1037 over the under-construction body. */
1038 for (opno = 0; opno < noutputs; opno++)
1039 if (reg_overlap_mentioned_p (clobbered_reg, output_rtx[opno]))
1040 internal_error ("asm clobber conflict with output operand");
1042 for (opno = 0; opno < ninputs - ninout; opno++)
1043 if (reg_overlap_mentioned_p (clobbered_reg,
1044 ASM_OPERANDS_INPUT (obody, opno)))
1045 internal_error ("asm clobber conflict with input operand");
1048 XVECEXP (body, 0, i++)
1049 = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
1052 emit_insn (body);
1055 /* For any outputs that needed reloading into registers, spill them
1056 back to where they belong. */
1057 for (i = 0; i < noutputs; ++i)
1058 if (real_output_rtx[i])
1059 emit_move_insn (real_output_rtx[i], output_rtx[i]);
1061 free_temp_slots ();
1064 void
1065 expand_asm_expr (tree exp)
1067 int noutputs, i;
1068 tree outputs, tail;
1069 tree *o;
1071 if (ASM_INPUT_P (exp))
1073 expand_asm (ASM_STRING (exp), ASM_VOLATILE_P (exp));
1074 return;
1077 outputs = ASM_OUTPUTS (exp);
1078 noutputs = list_length (outputs);
1079 /* o[I] is the place that output number I should be written. */
1080 o = (tree *) alloca (noutputs * sizeof (tree));
1082 /* Record the contents of OUTPUTS before it is modified. */
1083 for (i = 0, tail = outputs; tail; tail = TREE_CHAIN (tail), i++)
1084 o[i] = TREE_VALUE (tail);
1086 /* Generate the ASM_OPERANDS insn; store into the TREE_VALUEs of
1087 OUTPUTS some trees for where the values were actually stored. */
1088 expand_asm_operands (ASM_STRING (exp), outputs, ASM_INPUTS (exp),
1089 ASM_CLOBBERS (exp), ASM_VOLATILE_P (exp),
1090 input_location);
1092 /* Copy all the intermediate outputs into the specified outputs. */
1093 for (i = 0, tail = outputs; tail; tail = TREE_CHAIN (tail), i++)
1095 if (o[i] != TREE_VALUE (tail))
1097 expand_assignment (o[i], TREE_VALUE (tail));
1098 free_temp_slots ();
1100 /* Restore the original value so that it's correct the next
1101 time we expand this function. */
1102 TREE_VALUE (tail) = o[i];
1107 /* A subroutine of expand_asm_operands. Check that all operands have
1108 the same number of alternatives. Return true if so. */
1110 static bool
1111 check_operand_nalternatives (tree outputs, tree inputs)
1113 if (outputs || inputs)
1115 tree tmp = TREE_PURPOSE (outputs ? outputs : inputs);
1116 int nalternatives
1117 = n_occurrences (',', TREE_STRING_POINTER (TREE_VALUE (tmp)));
1118 tree next = inputs;
1120 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
1122 error ("too many alternatives in %<asm%>");
1123 return false;
1126 tmp = outputs;
1127 while (tmp)
1129 const char *constraint
1130 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (tmp)));
1132 if (n_occurrences (',', constraint) != nalternatives)
1134 error ("operand constraints for %<asm%> differ "
1135 "in number of alternatives");
1136 return false;
1139 if (TREE_CHAIN (tmp))
1140 tmp = TREE_CHAIN (tmp);
1141 else
1142 tmp = next, next = 0;
1146 return true;
1149 /* A subroutine of expand_asm_operands. Check that all operand names
1150 are unique. Return true if so. We rely on the fact that these names
1151 are identifiers, and so have been canonicalized by get_identifier,
1152 so all we need are pointer comparisons. */
1154 static bool
1155 check_unique_operand_names (tree outputs, tree inputs)
1157 tree i, j;
1159 for (i = outputs; i ; i = TREE_CHAIN (i))
1161 tree i_name = TREE_PURPOSE (TREE_PURPOSE (i));
1162 if (! i_name)
1163 continue;
1165 for (j = TREE_CHAIN (i); j ; j = TREE_CHAIN (j))
1166 if (simple_cst_equal (i_name, TREE_PURPOSE (TREE_PURPOSE (j))))
1167 goto failure;
1170 for (i = inputs; i ; i = TREE_CHAIN (i))
1172 tree i_name = TREE_PURPOSE (TREE_PURPOSE (i));
1173 if (! i_name)
1174 continue;
1176 for (j = TREE_CHAIN (i); j ; j = TREE_CHAIN (j))
1177 if (simple_cst_equal (i_name, TREE_PURPOSE (TREE_PURPOSE (j))))
1178 goto failure;
1179 for (j = outputs; j ; j = TREE_CHAIN (j))
1180 if (simple_cst_equal (i_name, TREE_PURPOSE (TREE_PURPOSE (j))))
1181 goto failure;
1184 return true;
1186 failure:
1187 error ("duplicate asm operand name %qs",
1188 TREE_STRING_POINTER (TREE_PURPOSE (TREE_PURPOSE (i))));
1189 return false;
1192 /* A subroutine of expand_asm_operands. Resolve the names of the operands
1193 in *POUTPUTS and *PINPUTS to numbers, and replace the name expansions in
1194 STRING and in the constraints to those numbers. */
1196 tree
1197 resolve_asm_operand_names (tree string, tree outputs, tree inputs)
1199 char *buffer;
1200 char *p;
1201 const char *c;
1202 tree t;
1204 check_unique_operand_names (outputs, inputs);
1206 /* Substitute [<name>] in input constraint strings. There should be no
1207 named operands in output constraints. */
1208 for (t = inputs; t ; t = TREE_CHAIN (t))
1210 c = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
1211 if (strchr (c, '[') != NULL)
1213 p = buffer = xstrdup (c);
1214 while ((p = strchr (p, '[')) != NULL)
1215 p = resolve_operand_name_1 (p, outputs, inputs);
1216 TREE_VALUE (TREE_PURPOSE (t))
1217 = build_string (strlen (buffer), buffer);
1218 free (buffer);
1222 /* Now check for any needed substitutions in the template. */
1223 c = TREE_STRING_POINTER (string);
1224 while ((c = strchr (c, '%')) != NULL)
1226 if (c[1] == '[')
1227 break;
1228 else if (ISALPHA (c[1]) && c[2] == '[')
1229 break;
1230 else
1232 c += 1;
1233 continue;
1237 if (c)
1239 /* OK, we need to make a copy so we can perform the substitutions.
1240 Assume that we will not need extra space--we get to remove '['
1241 and ']', which means we cannot have a problem until we have more
1242 than 999 operands. */
1243 buffer = xstrdup (TREE_STRING_POINTER (string));
1244 p = buffer + (c - TREE_STRING_POINTER (string));
1246 while ((p = strchr (p, '%')) != NULL)
1248 if (p[1] == '[')
1249 p += 1;
1250 else if (ISALPHA (p[1]) && p[2] == '[')
1251 p += 2;
1252 else
1254 p += 1;
1255 continue;
1258 p = resolve_operand_name_1 (p, outputs, inputs);
1261 string = build_string (strlen (buffer), buffer);
1262 free (buffer);
1265 return string;
1268 /* A subroutine of resolve_operand_names. P points to the '[' for a
1269 potential named operand of the form [<name>]. In place, replace
1270 the name and brackets with a number. Return a pointer to the
1271 balance of the string after substitution. */
1273 static char *
1274 resolve_operand_name_1 (char *p, tree outputs, tree inputs)
1276 char *q;
1277 int op;
1278 tree t;
1279 size_t len;
1281 /* Collect the operand name. */
1282 q = strchr (p, ']');
1283 if (!q)
1285 error ("missing close brace for named operand");
1286 return strchr (p, '\0');
1288 len = q - p - 1;
1290 /* Resolve the name to a number. */
1291 for (op = 0, t = outputs; t ; t = TREE_CHAIN (t), op++)
1293 tree name = TREE_PURPOSE (TREE_PURPOSE (t));
1294 if (name)
1296 const char *c = TREE_STRING_POINTER (name);
1297 if (strncmp (c, p + 1, len) == 0 && c[len] == '\0')
1298 goto found;
1301 for (t = inputs; t ; t = TREE_CHAIN (t), op++)
1303 tree name = TREE_PURPOSE (TREE_PURPOSE (t));
1304 if (name)
1306 const char *c = TREE_STRING_POINTER (name);
1307 if (strncmp (c, p + 1, len) == 0 && c[len] == '\0')
1308 goto found;
1312 *q = '\0';
1313 error ("undefined named operand %qs", p + 1);
1314 op = 0;
1315 found:
1317 /* Replace the name with the number. Unfortunately, not all libraries
1318 get the return value of sprintf correct, so search for the end of the
1319 generated string by hand. */
1320 sprintf (p, "%d", op);
1321 p = strchr (p, '\0');
1323 /* Verify the no extra buffer space assumption. */
1324 gcc_assert (p <= q);
1326 /* Shift the rest of the buffer down to fill the gap. */
1327 memmove (p, q + 1, strlen (q + 1) + 1);
1329 return p;
1332 /* Generate RTL to evaluate the expression EXP. */
1334 void
1335 expand_expr_stmt (tree exp)
1337 rtx value;
1338 tree type;
1340 value = expand_expr (exp, const0_rtx, VOIDmode, 0);
1341 type = TREE_TYPE (exp);
1343 /* If all we do is reference a volatile value in memory,
1344 copy it to a register to be sure it is actually touched. */
1345 if (value && MEM_P (value) && TREE_THIS_VOLATILE (exp))
1347 if (TYPE_MODE (type) == VOIDmode)
1349 else if (TYPE_MODE (type) != BLKmode)
1350 value = copy_to_reg (value);
1351 else
1353 rtx lab = gen_label_rtx ();
1355 /* Compare the value with itself to reference it. */
1356 emit_cmp_and_jump_insns (value, value, EQ,
1357 expand_expr (TYPE_SIZE (type),
1358 NULL_RTX, VOIDmode, 0),
1359 BLKmode, 0, lab);
1360 emit_label (lab);
1364 /* Free any temporaries used to evaluate this expression. */
1365 free_temp_slots ();
1368 /* Warn if EXP contains any computations whose results are not used.
1369 Return 1 if a warning is printed; 0 otherwise. LOCUS is the
1370 (potential) location of the expression. */
1373 warn_if_unused_value (tree exp, location_t locus)
1375 restart:
1376 if (TREE_USED (exp))
1377 return 0;
1379 /* Don't warn about void constructs. This includes casting to void,
1380 void function calls, and statement expressions with a final cast
1381 to void. */
1382 if (VOID_TYPE_P (TREE_TYPE (exp)))
1383 return 0;
1385 if (EXPR_HAS_LOCATION (exp))
1386 locus = EXPR_LOCATION (exp);
1388 switch (TREE_CODE (exp))
1390 case PREINCREMENT_EXPR:
1391 case POSTINCREMENT_EXPR:
1392 case PREDECREMENT_EXPR:
1393 case POSTDECREMENT_EXPR:
1394 case MODIFY_EXPR:
1395 case INIT_EXPR:
1396 case TARGET_EXPR:
1397 case CALL_EXPR:
1398 case TRY_CATCH_EXPR:
1399 case WITH_CLEANUP_EXPR:
1400 case EXIT_EXPR:
1401 return 0;
1403 case BIND_EXPR:
1404 /* For a binding, warn if no side effect within it. */
1405 exp = BIND_EXPR_BODY (exp);
1406 goto restart;
1408 case SAVE_EXPR:
1409 exp = TREE_OPERAND (exp, 0);
1410 goto restart;
1412 case TRUTH_ORIF_EXPR:
1413 case TRUTH_ANDIF_EXPR:
1414 /* In && or ||, warn if 2nd operand has no side effect. */
1415 exp = TREE_OPERAND (exp, 1);
1416 goto restart;
1418 case COMPOUND_EXPR:
1419 if (TREE_NO_WARNING (exp))
1420 return 0;
1421 if (warn_if_unused_value (TREE_OPERAND (exp, 0), locus))
1422 return 1;
1423 /* Let people do `(foo (), 0)' without a warning. */
1424 if (TREE_CONSTANT (TREE_OPERAND (exp, 1)))
1425 return 0;
1426 exp = TREE_OPERAND (exp, 1);
1427 goto restart;
1429 case NOP_EXPR:
1430 case CONVERT_EXPR:
1431 case NON_LVALUE_EXPR:
1432 /* Don't warn about conversions not explicit in the user's program. */
1433 if (TREE_NO_WARNING (exp))
1434 return 0;
1435 /* Assignment to a cast usually results in a cast of a modify.
1436 Don't complain about that. There can be an arbitrary number of
1437 casts before the modify, so we must loop until we find the first
1438 non-cast expression and then test to see if that is a modify. */
1440 tree tem = TREE_OPERAND (exp, 0);
1442 while (TREE_CODE (tem) == CONVERT_EXPR || TREE_CODE (tem) == NOP_EXPR)
1443 tem = TREE_OPERAND (tem, 0);
1445 if (TREE_CODE (tem) == MODIFY_EXPR || TREE_CODE (tem) == INIT_EXPR
1446 || TREE_CODE (tem) == CALL_EXPR)
1447 return 0;
1449 goto maybe_warn;
1451 case INDIRECT_REF:
1452 /* Don't warn about automatic dereferencing of references, since
1453 the user cannot control it. */
1454 if (TREE_CODE (TREE_TYPE (TREE_OPERAND (exp, 0))) == REFERENCE_TYPE)
1456 exp = TREE_OPERAND (exp, 0);
1457 goto restart;
1459 /* Fall through. */
1461 default:
1462 /* Referencing a volatile value is a side effect, so don't warn. */
1463 if ((DECL_P (exp) || REFERENCE_CLASS_P (exp))
1464 && TREE_THIS_VOLATILE (exp))
1465 return 0;
1467 /* If this is an expression which has no operands, there is no value
1468 to be unused. There are no such language-independent codes,
1469 but front ends may define such. */
1470 if (EXPRESSION_CLASS_P (exp) && TREE_CODE_LENGTH (TREE_CODE (exp)) == 0)
1471 return 0;
1473 maybe_warn:
1474 /* If this is an expression with side effects, don't warn. */
1475 if (TREE_SIDE_EFFECTS (exp))
1476 return 0;
1478 warning (0, "%Hvalue computed is not used", &locus);
1479 return 1;
1484 /* Generate RTL to return from the current function, with no value.
1485 (That is, we do not do anything about returning any value.) */
1487 void
1488 expand_null_return (void)
1490 /* If this function was declared to return a value, but we
1491 didn't, clobber the return registers so that they are not
1492 propagated live to the rest of the function. */
1493 clobber_return_register ();
1495 expand_null_return_1 ();
1498 /* Generate RTL to return directly from the current function.
1499 (That is, we bypass any return value.) */
1501 void
1502 expand_naked_return (void)
1504 rtx end_label;
1506 clear_pending_stack_adjust ();
1507 do_pending_stack_adjust ();
1509 end_label = naked_return_label;
1510 if (end_label == 0)
1511 end_label = naked_return_label = gen_label_rtx ();
1513 emit_jump (end_label);
1516 /* Generate RTL to return from the current function, with value VAL. */
1518 static void
1519 expand_value_return (rtx val)
1521 /* Copy the value to the return location
1522 unless it's already there. */
1524 rtx return_reg = DECL_RTL (DECL_RESULT (current_function_decl));
1525 if (return_reg != val)
1527 tree type = TREE_TYPE (DECL_RESULT (current_function_decl));
1528 if (targetm.calls.promote_function_return (TREE_TYPE (current_function_decl)))
1530 int unsignedp = TYPE_UNSIGNED (type);
1531 enum machine_mode old_mode
1532 = DECL_MODE (DECL_RESULT (current_function_decl));
1533 enum machine_mode mode
1534 = promote_mode (type, old_mode, &unsignedp, 1);
1536 if (mode != old_mode)
1537 val = convert_modes (mode, old_mode, val, unsignedp);
1539 if (GET_CODE (return_reg) == PARALLEL)
1540 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
1541 else
1542 emit_move_insn (return_reg, val);
1545 expand_null_return_1 ();
1548 /* Output a return with no value. */
1550 static void
1551 expand_null_return_1 (void)
1553 clear_pending_stack_adjust ();
1554 do_pending_stack_adjust ();
1555 emit_jump (return_label);
1558 /* Generate RTL to evaluate the expression RETVAL and return it
1559 from the current function. */
1561 void
1562 expand_return (tree retval)
1564 rtx result_rtl;
1565 rtx val = 0;
1566 tree retval_rhs;
1568 /* If function wants no value, give it none. */
1569 if (TREE_CODE (TREE_TYPE (TREE_TYPE (current_function_decl))) == VOID_TYPE)
1571 expand_expr (retval, NULL_RTX, VOIDmode, 0);
1572 expand_null_return ();
1573 return;
1576 if (retval == error_mark_node)
1578 /* Treat this like a return of no value from a function that
1579 returns a value. */
1580 expand_null_return ();
1581 return;
1583 else if ((TREE_CODE (retval) == MODIFY_EXPR
1584 || TREE_CODE (retval) == INIT_EXPR)
1585 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
1586 retval_rhs = TREE_OPERAND (retval, 1);
1587 else
1588 retval_rhs = retval;
1590 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
1592 /* If we are returning the RESULT_DECL, then the value has already
1593 been stored into it, so we don't have to do anything special. */
1594 if (TREE_CODE (retval_rhs) == RESULT_DECL)
1595 expand_value_return (result_rtl);
1597 /* If the result is an aggregate that is being returned in one (or more)
1598 registers, load the registers here. The compiler currently can't handle
1599 copying a BLKmode value into registers. We could put this code in a
1600 more general area (for use by everyone instead of just function
1601 call/return), but until this feature is generally usable it is kept here
1602 (and in expand_call). */
1604 else if (retval_rhs != 0
1605 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
1606 && REG_P (result_rtl))
1608 int i;
1609 unsigned HOST_WIDE_INT bitpos, xbitpos;
1610 unsigned HOST_WIDE_INT padding_correction = 0;
1611 unsigned HOST_WIDE_INT bytes
1612 = int_size_in_bytes (TREE_TYPE (retval_rhs));
1613 int n_regs = (bytes + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
1614 unsigned int bitsize
1615 = MIN (TYPE_ALIGN (TREE_TYPE (retval_rhs)), BITS_PER_WORD);
1616 rtx *result_pseudos = alloca (sizeof (rtx) * n_regs);
1617 rtx result_reg, src = NULL_RTX, dst = NULL_RTX;
1618 rtx result_val = expand_expr (retval_rhs, NULL_RTX, VOIDmode, 0);
1619 enum machine_mode tmpmode, result_reg_mode;
1621 if (bytes == 0)
1623 expand_null_return ();
1624 return;
1627 /* If the structure doesn't take up a whole number of words, see
1628 whether the register value should be padded on the left or on
1629 the right. Set PADDING_CORRECTION to the number of padding
1630 bits needed on the left side.
1632 In most ABIs, the structure will be returned at the least end of
1633 the register, which translates to right padding on little-endian
1634 targets and left padding on big-endian targets. The opposite
1635 holds if the structure is returned at the most significant
1636 end of the register. */
1637 if (bytes % UNITS_PER_WORD != 0
1638 && (targetm.calls.return_in_msb (TREE_TYPE (retval_rhs))
1639 ? !BYTES_BIG_ENDIAN
1640 : BYTES_BIG_ENDIAN))
1641 padding_correction = (BITS_PER_WORD - ((bytes % UNITS_PER_WORD)
1642 * BITS_PER_UNIT));
1644 /* Copy the structure BITSIZE bits at a time. */
1645 for (bitpos = 0, xbitpos = padding_correction;
1646 bitpos < bytes * BITS_PER_UNIT;
1647 bitpos += bitsize, xbitpos += bitsize)
1649 /* We need a new destination pseudo each time xbitpos is
1650 on a word boundary and when xbitpos == padding_correction
1651 (the first time through). */
1652 if (xbitpos % BITS_PER_WORD == 0
1653 || xbitpos == padding_correction)
1655 /* Generate an appropriate register. */
1656 dst = gen_reg_rtx (word_mode);
1657 result_pseudos[xbitpos / BITS_PER_WORD] = dst;
1659 /* Clear the destination before we move anything into it. */
1660 emit_move_insn (dst, CONST0_RTX (GET_MODE (dst)));
1663 /* We need a new source operand each time bitpos is on a word
1664 boundary. */
1665 if (bitpos % BITS_PER_WORD == 0)
1666 src = operand_subword_force (result_val,
1667 bitpos / BITS_PER_WORD,
1668 BLKmode);
1670 /* Use bitpos for the source extraction (left justified) and
1671 xbitpos for the destination store (right justified). */
1672 store_bit_field (dst, bitsize, xbitpos % BITS_PER_WORD, word_mode,
1673 extract_bit_field (src, bitsize,
1674 bitpos % BITS_PER_WORD, 1,
1675 NULL_RTX, word_mode, word_mode));
1678 tmpmode = GET_MODE (result_rtl);
1679 if (tmpmode == BLKmode)
1681 /* Find the smallest integer mode large enough to hold the
1682 entire structure and use that mode instead of BLKmode
1683 on the USE insn for the return register. */
1684 for (tmpmode = GET_CLASS_NARROWEST_MODE (MODE_INT);
1685 tmpmode != VOIDmode;
1686 tmpmode = GET_MODE_WIDER_MODE (tmpmode))
1687 /* Have we found a large enough mode? */
1688 if (GET_MODE_SIZE (tmpmode) >= bytes)
1689 break;
1691 /* A suitable mode should have been found. */
1692 gcc_assert (tmpmode != VOIDmode);
1694 PUT_MODE (result_rtl, tmpmode);
1697 if (GET_MODE_SIZE (tmpmode) < GET_MODE_SIZE (word_mode))
1698 result_reg_mode = word_mode;
1699 else
1700 result_reg_mode = tmpmode;
1701 result_reg = gen_reg_rtx (result_reg_mode);
1703 for (i = 0; i < n_regs; i++)
1704 emit_move_insn (operand_subword (result_reg, i, 0, result_reg_mode),
1705 result_pseudos[i]);
1707 if (tmpmode != result_reg_mode)
1708 result_reg = gen_lowpart (tmpmode, result_reg);
1710 expand_value_return (result_reg);
1712 else if (retval_rhs != 0
1713 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
1714 && (REG_P (result_rtl)
1715 || (GET_CODE (result_rtl) == PARALLEL)))
1717 /* Calculate the return value into a temporary (usually a pseudo
1718 reg). */
1719 tree ot = TREE_TYPE (DECL_RESULT (current_function_decl));
1720 tree nt = build_qualified_type (ot, TYPE_QUALS (ot) | TYPE_QUAL_CONST);
1722 val = assign_temp (nt, 0, 0, 1);
1723 val = expand_expr (retval_rhs, val, GET_MODE (val), 0);
1724 val = force_not_mem (val);
1725 /* Return the calculated value. */
1726 expand_value_return (val);
1728 else
1730 /* No hard reg used; calculate value into hard return reg. */
1731 expand_expr (retval, const0_rtx, VOIDmode, 0);
1732 expand_value_return (result_rtl);
1736 /* Given a pointer to a BLOCK node return nonzero if (and only if) the node
1737 in question represents the outermost pair of curly braces (i.e. the "body
1738 block") of a function or method.
1740 For any BLOCK node representing a "body block" of a function or method, the
1741 BLOCK_SUPERCONTEXT of the node will point to another BLOCK node which
1742 represents the outermost (function) scope for the function or method (i.e.
1743 the one which includes the formal parameters). The BLOCK_SUPERCONTEXT of
1744 *that* node in turn will point to the relevant FUNCTION_DECL node. */
1747 is_body_block (tree stmt)
1749 if (lang_hooks.no_body_blocks)
1750 return 0;
1752 if (TREE_CODE (stmt) == BLOCK)
1754 tree parent = BLOCK_SUPERCONTEXT (stmt);
1756 if (parent && TREE_CODE (parent) == BLOCK)
1758 tree grandparent = BLOCK_SUPERCONTEXT (parent);
1760 if (grandparent && TREE_CODE (grandparent) == FUNCTION_DECL)
1761 return 1;
1765 return 0;
1768 /* Emit code to restore vital registers at the beginning of a nonlocal goto
1769 handler. */
1770 static void
1771 expand_nl_goto_receiver (void)
1773 /* Clobber the FP when we get here, so we have to make sure it's
1774 marked as used by this function. */
1775 emit_insn (gen_rtx_USE (VOIDmode, hard_frame_pointer_rtx));
1777 /* Mark the static chain as clobbered here so life information
1778 doesn't get messed up for it. */
1779 emit_insn (gen_rtx_CLOBBER (VOIDmode, static_chain_rtx));
1781 #ifdef HAVE_nonlocal_goto
1782 if (! HAVE_nonlocal_goto)
1783 #endif
1784 /* First adjust our frame pointer to its actual value. It was
1785 previously set to the start of the virtual area corresponding to
1786 the stacked variables when we branched here and now needs to be
1787 adjusted to the actual hardware fp value.
1789 Assignments are to virtual registers are converted by
1790 instantiate_virtual_regs into the corresponding assignment
1791 to the underlying register (fp in this case) that makes
1792 the original assignment true.
1793 So the following insn will actually be
1794 decrementing fp by STARTING_FRAME_OFFSET. */
1795 emit_move_insn (virtual_stack_vars_rtx, hard_frame_pointer_rtx);
1797 #if ARG_POINTER_REGNUM != HARD_FRAME_POINTER_REGNUM
1798 if (fixed_regs[ARG_POINTER_REGNUM])
1800 #ifdef ELIMINABLE_REGS
1801 /* If the argument pointer can be eliminated in favor of the
1802 frame pointer, we don't need to restore it. We assume here
1803 that if such an elimination is present, it can always be used.
1804 This is the case on all known machines; if we don't make this
1805 assumption, we do unnecessary saving on many machines. */
1806 static const struct elims {const int from, to;} elim_regs[] = ELIMINABLE_REGS;
1807 size_t i;
1809 for (i = 0; i < ARRAY_SIZE (elim_regs); i++)
1810 if (elim_regs[i].from == ARG_POINTER_REGNUM
1811 && elim_regs[i].to == HARD_FRAME_POINTER_REGNUM)
1812 break;
1814 if (i == ARRAY_SIZE (elim_regs))
1815 #endif
1817 /* Now restore our arg pointer from the address at which it
1818 was saved in our stack frame. */
1819 emit_move_insn (virtual_incoming_args_rtx,
1820 copy_to_reg (get_arg_pointer_save_area (cfun)));
1823 #endif
1825 #ifdef HAVE_nonlocal_goto_receiver
1826 if (HAVE_nonlocal_goto_receiver)
1827 emit_insn (gen_nonlocal_goto_receiver ());
1828 #endif
1830 /* @@@ This is a kludge. Not all machine descriptions define a blockage
1831 insn, but we must not allow the code we just generated to be reordered
1832 by scheduling. Specifically, the update of the frame pointer must
1833 happen immediately, not later. So emit an ASM_INPUT to act as blockage
1834 insn. */
1835 emit_insn (gen_rtx_ASM_INPUT (VOIDmode, ""));
1838 /* Generate RTL for the automatic variable declaration DECL.
1839 (Other kinds of declarations are simply ignored if seen here.) */
1841 void
1842 expand_decl (tree decl)
1844 tree type;
1846 type = TREE_TYPE (decl);
1848 /* For a CONST_DECL, set mode, alignment, and sizes from those of the
1849 type in case this node is used in a reference. */
1850 if (TREE_CODE (decl) == CONST_DECL)
1852 DECL_MODE (decl) = TYPE_MODE (type);
1853 DECL_ALIGN (decl) = TYPE_ALIGN (type);
1854 DECL_SIZE (decl) = TYPE_SIZE (type);
1855 DECL_SIZE_UNIT (decl) = TYPE_SIZE_UNIT (type);
1856 return;
1859 /* Otherwise, only automatic variables need any expansion done. Static and
1860 external variables, and external functions, will be handled by
1861 `assemble_variable' (called from finish_decl). TYPE_DECL requires
1862 nothing. PARM_DECLs are handled in `assign_parms'. */
1863 if (TREE_CODE (decl) != VAR_DECL)
1864 return;
1866 if (TREE_STATIC (decl) || DECL_EXTERNAL (decl))
1867 return;
1869 /* Create the RTL representation for the variable. */
1871 if (type == error_mark_node)
1872 SET_DECL_RTL (decl, gen_rtx_MEM (BLKmode, const0_rtx));
1874 else if (DECL_SIZE (decl) == 0)
1875 /* Variable with incomplete type. */
1877 rtx x;
1878 if (DECL_INITIAL (decl) == 0)
1879 /* Error message was already done; now avoid a crash. */
1880 x = gen_rtx_MEM (BLKmode, const0_rtx);
1881 else
1882 /* An initializer is going to decide the size of this array.
1883 Until we know the size, represent its address with a reg. */
1884 x = gen_rtx_MEM (BLKmode, gen_reg_rtx (Pmode));
1886 set_mem_attributes (x, decl, 1);
1887 SET_DECL_RTL (decl, x);
1889 else if (use_register_for_decl (decl))
1891 /* Automatic variable that can go in a register. */
1892 int unsignedp = TYPE_UNSIGNED (type);
1893 enum machine_mode reg_mode
1894 = promote_mode (type, DECL_MODE (decl), &unsignedp, 0);
1896 SET_DECL_RTL (decl, gen_reg_rtx (reg_mode));
1898 /* Note if the object is a user variable. */
1899 if (!DECL_ARTIFICIAL (decl))
1901 mark_user_reg (DECL_RTL (decl));
1903 /* Trust user variables which have a pointer type to really
1904 be pointers. Do not trust compiler generated temporaries
1905 as our type system is totally busted as it relates to
1906 pointer arithmetic which translates into lots of compiler
1907 generated objects with pointer types, but which are not really
1908 pointers. */
1909 if (POINTER_TYPE_P (type))
1910 mark_reg_pointer (DECL_RTL (decl),
1911 TYPE_ALIGN (TREE_TYPE (TREE_TYPE (decl))));
1915 else if (TREE_CODE (DECL_SIZE_UNIT (decl)) == INTEGER_CST
1916 && ! (flag_stack_check && ! STACK_CHECK_BUILTIN
1917 && 0 < compare_tree_int (DECL_SIZE_UNIT (decl),
1918 STACK_CHECK_MAX_VAR_SIZE)))
1920 /* Variable of fixed size that goes on the stack. */
1921 rtx oldaddr = 0;
1922 rtx addr;
1923 rtx x;
1925 /* If we previously made RTL for this decl, it must be an array
1926 whose size was determined by the initializer.
1927 The old address was a register; set that register now
1928 to the proper address. */
1929 if (DECL_RTL_SET_P (decl))
1931 gcc_assert (MEM_P (DECL_RTL (decl)));
1932 gcc_assert (REG_P (XEXP (DECL_RTL (decl), 0)));
1933 oldaddr = XEXP (DECL_RTL (decl), 0);
1936 /* Set alignment we actually gave this decl. */
1937 DECL_ALIGN (decl) = (DECL_MODE (decl) == BLKmode ? BIGGEST_ALIGNMENT
1938 : GET_MODE_BITSIZE (DECL_MODE (decl)));
1939 DECL_USER_ALIGN (decl) = 0;
1941 x = assign_temp (decl, 1, 1, 1);
1942 set_mem_attributes (x, decl, 1);
1943 SET_DECL_RTL (decl, x);
1945 if (oldaddr)
1947 addr = force_operand (XEXP (DECL_RTL (decl), 0), oldaddr);
1948 if (addr != oldaddr)
1949 emit_move_insn (oldaddr, addr);
1952 else
1953 /* Dynamic-size object: must push space on the stack. */
1955 rtx address, size, x;
1957 /* Record the stack pointer on entry to block, if have
1958 not already done so. */
1959 do_pending_stack_adjust ();
1961 /* Compute the variable's size, in bytes. This will expand any
1962 needed SAVE_EXPRs for the first time. */
1963 size = expand_expr (DECL_SIZE_UNIT (decl), NULL_RTX, VOIDmode, 0);
1964 free_temp_slots ();
1966 /* Allocate space on the stack for the variable. Note that
1967 DECL_ALIGN says how the variable is to be aligned and we
1968 cannot use it to conclude anything about the alignment of
1969 the size. */
1970 address = allocate_dynamic_stack_space (size, NULL_RTX,
1971 TYPE_ALIGN (TREE_TYPE (decl)));
1973 /* Reference the variable indirect through that rtx. */
1974 x = gen_rtx_MEM (DECL_MODE (decl), address);
1975 set_mem_attributes (x, decl, 1);
1976 SET_DECL_RTL (decl, x);
1979 /* Indicate the alignment we actually gave this variable. */
1980 #ifdef STACK_BOUNDARY
1981 DECL_ALIGN (decl) = STACK_BOUNDARY;
1982 #else
1983 DECL_ALIGN (decl) = BIGGEST_ALIGNMENT;
1984 #endif
1985 DECL_USER_ALIGN (decl) = 0;
1989 /* Emit code to save the current value of stack. */
1991 expand_stack_save (void)
1993 rtx ret = NULL_RTX;
1995 do_pending_stack_adjust ();
1996 emit_stack_save (SAVE_BLOCK, &ret, NULL_RTX);
1997 return ret;
2000 /* Emit code to restore the current value of stack. */
2001 void
2002 expand_stack_restore (tree var)
2004 rtx sa = DECL_RTL (var);
2006 emit_stack_restore (SAVE_BLOCK, sa, NULL_RTX);
2009 /* DECL is an anonymous union. CLEANUP is a cleanup for DECL.
2010 DECL_ELTS is the list of elements that belong to DECL's type.
2011 In each, the TREE_VALUE is a VAR_DECL, and the TREE_PURPOSE a cleanup. */
2013 void
2014 expand_anon_union_decl (tree decl, tree cleanup ATTRIBUTE_UNUSED,
2015 tree decl_elts)
2017 rtx x;
2018 tree t;
2020 /* If any of the elements are addressable, so is the entire union. */
2021 for (t = decl_elts; t; t = TREE_CHAIN (t))
2022 if (TREE_ADDRESSABLE (TREE_VALUE (t)))
2024 TREE_ADDRESSABLE (decl) = 1;
2025 break;
2028 expand_decl (decl);
2029 x = DECL_RTL (decl);
2031 /* Go through the elements, assigning RTL to each. */
2032 for (t = decl_elts; t; t = TREE_CHAIN (t))
2034 tree decl_elt = TREE_VALUE (t);
2035 enum machine_mode mode = TYPE_MODE (TREE_TYPE (decl_elt));
2036 rtx decl_rtl;
2038 /* If any of the elements are addressable, so is the entire
2039 union. */
2040 if (TREE_USED (decl_elt))
2041 TREE_USED (decl) = 1;
2043 /* Propagate the union's alignment to the elements. */
2044 DECL_ALIGN (decl_elt) = DECL_ALIGN (decl);
2045 DECL_USER_ALIGN (decl_elt) = DECL_USER_ALIGN (decl);
2047 /* If the element has BLKmode and the union doesn't, the union is
2048 aligned such that the element doesn't need to have BLKmode, so
2049 change the element's mode to the appropriate one for its size. */
2050 if (mode == BLKmode && DECL_MODE (decl) != BLKmode)
2051 DECL_MODE (decl_elt) = mode
2052 = mode_for_size_tree (DECL_SIZE (decl_elt), MODE_INT, 1);
2054 if (mode == GET_MODE (x))
2055 decl_rtl = x;
2056 else if (MEM_P (x))
2057 /* (SUBREG (MEM ...)) at RTL generation time is invalid, so we
2058 instead create a new MEM rtx with the proper mode. */
2059 decl_rtl = adjust_address_nv (x, mode, 0);
2060 else
2062 gcc_assert (REG_P (x));
2063 decl_rtl = gen_lowpart_SUBREG (mode, x);
2065 SET_DECL_RTL (decl_elt, decl_rtl);
2069 /* Do the insertion of a case label into case_list. The labels are
2070 fed to us in descending order from the sorted vector of case labels used
2071 in the tree part of the middle end. So the list we construct is
2072 sorted in ascending order. The bounds on the case range, LOW and HIGH,
2073 are converted to case's index type TYPE. */
2075 static struct case_node *
2076 add_case_node (struct case_node *head, tree type, tree low, tree high,
2077 tree label)
2079 tree min_value, max_value;
2080 struct case_node *r;
2082 gcc_assert (TREE_CODE (low) == INTEGER_CST);
2083 gcc_assert (!high || TREE_CODE (high) == INTEGER_CST);
2085 min_value = TYPE_MIN_VALUE (type);
2086 max_value = TYPE_MAX_VALUE (type);
2088 /* If there's no HIGH value, then this is not a case range; it's
2089 just a simple case label. But that's just a degenerate case
2090 range.
2091 If the bounds are equal, turn this into the one-value case. */
2092 if (!high || tree_int_cst_equal (low, high))
2094 /* If the simple case value is unreachable, ignore it. */
2095 if ((TREE_CODE (min_value) == INTEGER_CST
2096 && tree_int_cst_compare (low, min_value) < 0)
2097 || (TREE_CODE (max_value) == INTEGER_CST
2098 && tree_int_cst_compare (low, max_value) > 0))
2099 return head;
2100 low = fold_convert (type, low);
2101 high = low;
2103 else
2105 /* If the entire case range is unreachable, ignore it. */
2106 if ((TREE_CODE (min_value) == INTEGER_CST
2107 && tree_int_cst_compare (high, min_value) < 0)
2108 || (TREE_CODE (max_value) == INTEGER_CST
2109 && tree_int_cst_compare (low, max_value) > 0))
2110 return head;
2112 /* If the lower bound is less than the index type's minimum
2113 value, truncate the range bounds. */
2114 if (TREE_CODE (min_value) == INTEGER_CST
2115 && tree_int_cst_compare (low, min_value) < 0)
2116 low = min_value;
2117 low = fold_convert (type, low);
2119 /* If the upper bound is greater than the index type's maximum
2120 value, truncate the range bounds. */
2121 if (TREE_CODE (max_value) == INTEGER_CST
2122 && tree_int_cst_compare (high, max_value) > 0)
2123 high = max_value;
2124 high = fold_convert (type, high);
2128 /* Add this label to the chain. */
2129 r = ggc_alloc (sizeof (struct case_node));
2130 r->low = low;
2131 r->high = high;
2132 r->code_label = label;
2133 r->parent = r->left = NULL;
2134 r->right = head;
2135 return r;
2138 /* Maximum number of case bit tests. */
2139 #define MAX_CASE_BIT_TESTS 3
2141 /* By default, enable case bit tests on targets with ashlsi3. */
2142 #ifndef CASE_USE_BIT_TESTS
2143 #define CASE_USE_BIT_TESTS (ashl_optab->handlers[word_mode].insn_code \
2144 != CODE_FOR_nothing)
2145 #endif
2148 /* A case_bit_test represents a set of case nodes that may be
2149 selected from using a bit-wise comparison. HI and LO hold
2150 the integer to be tested against, LABEL contains the label
2151 to jump to upon success and BITS counts the number of case
2152 nodes handled by this test, typically the number of bits
2153 set in HI:LO. */
2155 struct case_bit_test
2157 HOST_WIDE_INT hi;
2158 HOST_WIDE_INT lo;
2159 rtx label;
2160 int bits;
2163 /* Determine whether "1 << x" is relatively cheap in word_mode. */
2165 static
2166 bool lshift_cheap_p (void)
2168 static bool init = false;
2169 static bool cheap = true;
2171 if (!init)
2173 rtx reg = gen_rtx_REG (word_mode, 10000);
2174 int cost = rtx_cost (gen_rtx_ASHIFT (word_mode, const1_rtx, reg), SET);
2175 cheap = cost < COSTS_N_INSNS (3);
2176 init = true;
2179 return cheap;
2182 /* Comparison function for qsort to order bit tests by decreasing
2183 number of case nodes, i.e. the node with the most cases gets
2184 tested first. */
2186 static int
2187 case_bit_test_cmp (const void *p1, const void *p2)
2189 const struct case_bit_test *d1 = p1;
2190 const struct case_bit_test *d2 = p2;
2192 return d2->bits - d1->bits;
2195 /* Expand a switch statement by a short sequence of bit-wise
2196 comparisons. "switch(x)" is effectively converted into
2197 "if ((1 << (x-MINVAL)) & CST)" where CST and MINVAL are
2198 integer constants.
2200 INDEX_EXPR is the value being switched on, which is of
2201 type INDEX_TYPE. MINVAL is the lowest case value of in
2202 the case nodes, of INDEX_TYPE type, and RANGE is highest
2203 value minus MINVAL, also of type INDEX_TYPE. NODES is
2204 the set of case nodes, and DEFAULT_LABEL is the label to
2205 branch to should none of the cases match.
2207 There *MUST* be MAX_CASE_BIT_TESTS or less unique case
2208 node targets. */
2210 static void
2211 emit_case_bit_tests (tree index_type, tree index_expr, tree minval,
2212 tree range, case_node_ptr nodes, rtx default_label)
2214 struct case_bit_test test[MAX_CASE_BIT_TESTS];
2215 enum machine_mode mode;
2216 rtx expr, index, label;
2217 unsigned int i,j,lo,hi;
2218 struct case_node *n;
2219 unsigned int count;
2221 count = 0;
2222 for (n = nodes; n; n = n->right)
2224 label = label_rtx (n->code_label);
2225 for (i = 0; i < count; i++)
2226 if (label == test[i].label)
2227 break;
2229 if (i == count)
2231 gcc_assert (count < MAX_CASE_BIT_TESTS);
2232 test[i].hi = 0;
2233 test[i].lo = 0;
2234 test[i].label = label;
2235 test[i].bits = 1;
2236 count++;
2238 else
2239 test[i].bits++;
2241 lo = tree_low_cst (fold_build2 (MINUS_EXPR, index_type,
2242 n->low, minval), 1);
2243 hi = tree_low_cst (fold_build2 (MINUS_EXPR, index_type,
2244 n->high, minval), 1);
2245 for (j = lo; j <= hi; j++)
2246 if (j >= HOST_BITS_PER_WIDE_INT)
2247 test[i].hi |= (HOST_WIDE_INT) 1 << (j - HOST_BITS_PER_INT);
2248 else
2249 test[i].lo |= (HOST_WIDE_INT) 1 << j;
2252 qsort (test, count, sizeof(*test), case_bit_test_cmp);
2254 index_expr = fold_build2 (MINUS_EXPR, index_type,
2255 fold_convert (index_type, index_expr),
2256 fold_convert (index_type, minval));
2257 index = expand_expr (index_expr, NULL_RTX, VOIDmode, 0);
2258 do_pending_stack_adjust ();
2260 mode = TYPE_MODE (index_type);
2261 expr = expand_expr (range, NULL_RTX, VOIDmode, 0);
2262 emit_cmp_and_jump_insns (index, expr, GTU, NULL_RTX, mode, 1,
2263 default_label);
2265 index = convert_to_mode (word_mode, index, 0);
2266 index = expand_binop (word_mode, ashl_optab, const1_rtx,
2267 index, NULL_RTX, 1, OPTAB_WIDEN);
2269 for (i = 0; i < count; i++)
2271 expr = immed_double_const (test[i].lo, test[i].hi, word_mode);
2272 expr = expand_binop (word_mode, and_optab, index, expr,
2273 NULL_RTX, 1, OPTAB_WIDEN);
2274 emit_cmp_and_jump_insns (expr, const0_rtx, NE, NULL_RTX,
2275 word_mode, 1, test[i].label);
2278 emit_jump (default_label);
2281 #ifndef HAVE_casesi
2282 #define HAVE_casesi 0
2283 #endif
2285 #ifndef HAVE_tablejump
2286 #define HAVE_tablejump 0
2287 #endif
2289 /* Terminate a case (Pascal) or switch (C) statement
2290 in which ORIG_INDEX is the expression to be tested.
2291 If ORIG_TYPE is not NULL, it is the original ORIG_INDEX
2292 type as given in the source before any compiler conversions.
2293 Generate the code to test it and jump to the right place. */
2295 void
2296 expand_case (tree exp)
2298 tree minval = NULL_TREE, maxval = NULL_TREE, range = NULL_TREE;
2299 rtx default_label = 0;
2300 struct case_node *n;
2301 unsigned int count, uniq;
2302 rtx index;
2303 rtx table_label;
2304 int ncases;
2305 rtx *labelvec;
2306 int i, fail;
2307 rtx before_case, end, lab;
2309 tree vec = SWITCH_LABELS (exp);
2310 tree orig_type = TREE_TYPE (exp);
2311 tree index_expr = SWITCH_COND (exp);
2312 tree index_type = TREE_TYPE (index_expr);
2313 int unsignedp = TYPE_UNSIGNED (index_type);
2315 /* The insn after which the case dispatch should finally
2316 be emitted. Zero for a dummy. */
2317 rtx start;
2319 /* A list of case labels; it is first built as a list and it may then
2320 be rearranged into a nearly balanced binary tree. */
2321 struct case_node *case_list = 0;
2323 /* Label to jump to if no case matches. */
2324 tree default_label_decl;
2326 /* The switch body is lowered in gimplify.c, we should never have
2327 switches with a non-NULL SWITCH_BODY here. */
2328 gcc_assert (!SWITCH_BODY (exp));
2329 gcc_assert (SWITCH_LABELS (exp));
2331 do_pending_stack_adjust ();
2333 /* An ERROR_MARK occurs for various reasons including invalid data type. */
2334 if (index_type != error_mark_node)
2336 tree elt;
2337 bitmap label_bitmap;
2339 /* cleanup_tree_cfg removes all SWITCH_EXPR with their index
2340 expressions being INTEGER_CST. */
2341 gcc_assert (TREE_CODE (index_expr) != INTEGER_CST);
2343 /* The default case is at the end of TREE_VEC. */
2344 elt = TREE_VEC_ELT (vec, TREE_VEC_LENGTH (vec) - 1);
2345 gcc_assert (!CASE_HIGH (elt));
2346 gcc_assert (!CASE_LOW (elt));
2347 default_label_decl = CASE_LABEL (elt);
2349 for (i = TREE_VEC_LENGTH (vec) - 1; --i >= 0; )
2351 elt = TREE_VEC_ELT (vec, i);
2352 gcc_assert (CASE_LOW (elt));
2353 case_list = add_case_node (case_list, index_type,
2354 CASE_LOW (elt), CASE_HIGH (elt),
2355 CASE_LABEL (elt));
2359 /* Make sure start points to something that won't need any
2360 transformation before the end of this function. */
2361 start = get_last_insn ();
2362 if (! NOTE_P (start))
2364 emit_note (NOTE_INSN_DELETED);
2365 start = get_last_insn ();
2368 default_label = label_rtx (default_label_decl);
2370 before_case = get_last_insn ();
2372 /* Get upper and lower bounds of case values. */
2374 uniq = 0;
2375 count = 0;
2376 label_bitmap = BITMAP_ALLOC (NULL);
2377 for (n = case_list; n; n = n->right)
2379 /* Count the elements and track the largest and smallest
2380 of them (treating them as signed even if they are not). */
2381 if (count++ == 0)
2383 minval = n->low;
2384 maxval = n->high;
2386 else
2388 if (INT_CST_LT (n->low, minval))
2389 minval = n->low;
2390 if (INT_CST_LT (maxval, n->high))
2391 maxval = n->high;
2393 /* A range counts double, since it requires two compares. */
2394 if (! tree_int_cst_equal (n->low, n->high))
2395 count++;
2397 /* If we have not seen this label yet, then increase the
2398 number of unique case node targets seen. */
2399 lab = label_rtx (n->code_label);
2400 if (!bitmap_bit_p (label_bitmap, CODE_LABEL_NUMBER (lab)))
2402 bitmap_set_bit (label_bitmap, CODE_LABEL_NUMBER (lab));
2403 uniq++;
2407 BITMAP_FREE (label_bitmap);
2409 /* cleanup_tree_cfg removes all SWITCH_EXPR with a single
2410 destination, such as one with a default case only. However,
2411 it doesn't remove cases that are out of range for the switch
2412 type, so we may still get a zero here. */
2413 if (count == 0)
2415 emit_jump (default_label);
2416 return;
2419 /* Compute span of values. */
2420 range = fold_build2 (MINUS_EXPR, index_type, maxval, minval);
2422 /* Try implementing this switch statement by a short sequence of
2423 bit-wise comparisons. However, we let the binary-tree case
2424 below handle constant index expressions. */
2425 if (CASE_USE_BIT_TESTS
2426 && ! TREE_CONSTANT (index_expr)
2427 && compare_tree_int (range, GET_MODE_BITSIZE (word_mode)) < 0
2428 && compare_tree_int (range, 0) > 0
2429 && lshift_cheap_p ()
2430 && ((uniq == 1 && count >= 3)
2431 || (uniq == 2 && count >= 5)
2432 || (uniq == 3 && count >= 6)))
2434 /* Optimize the case where all the case values fit in a
2435 word without having to subtract MINVAL. In this case,
2436 we can optimize away the subtraction. */
2437 if (compare_tree_int (minval, 0) > 0
2438 && compare_tree_int (maxval, GET_MODE_BITSIZE (word_mode)) < 0)
2440 minval = build_int_cst (index_type, 0);
2441 range = maxval;
2443 emit_case_bit_tests (index_type, index_expr, minval, range,
2444 case_list, default_label);
2447 /* If range of values is much bigger than number of values,
2448 make a sequence of conditional branches instead of a dispatch.
2449 If the switch-index is a constant, do it this way
2450 because we can optimize it. */
2452 else if (count < case_values_threshold ()
2453 || compare_tree_int (range,
2454 (optimize_size ? 3 : 10) * count) > 0
2455 /* RANGE may be signed, and really large ranges will show up
2456 as negative numbers. */
2457 || compare_tree_int (range, 0) < 0
2458 #ifndef ASM_OUTPUT_ADDR_DIFF_ELT
2459 || flag_pic
2460 #endif
2461 || !flag_jump_tables
2462 || TREE_CONSTANT (index_expr)
2463 /* If neither casesi or tablejump is available, we can
2464 only go this way. */
2465 || (!HAVE_casesi && !HAVE_tablejump))
2467 index = expand_expr (index_expr, NULL_RTX, VOIDmode, 0);
2469 /* If the index is a short or char that we do not have
2470 an insn to handle comparisons directly, convert it to
2471 a full integer now, rather than letting each comparison
2472 generate the conversion. */
2474 if (GET_MODE_CLASS (GET_MODE (index)) == MODE_INT
2475 && ! have_insn_for (COMPARE, GET_MODE (index)))
2477 enum machine_mode wider_mode;
2478 for (wider_mode = GET_MODE (index); wider_mode != VOIDmode;
2479 wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2480 if (have_insn_for (COMPARE, wider_mode))
2482 index = convert_to_mode (wider_mode, index, unsignedp);
2483 break;
2487 do_pending_stack_adjust ();
2489 if (MEM_P (index))
2490 index = copy_to_reg (index);
2492 /* We generate a binary decision tree to select the
2493 appropriate target code. This is done as follows:
2495 The list of cases is rearranged into a binary tree,
2496 nearly optimal assuming equal probability for each case.
2498 The tree is transformed into RTL, eliminating
2499 redundant test conditions at the same time.
2501 If program flow could reach the end of the
2502 decision tree an unconditional jump to the
2503 default code is emitted. */
2505 use_cost_table
2506 = (TREE_CODE (orig_type) != ENUMERAL_TYPE
2507 && estimate_case_costs (case_list));
2508 balance_case_nodes (&case_list, NULL);
2509 emit_case_nodes (index, case_list, default_label, index_type);
2510 emit_jump (default_label);
2512 else
2514 table_label = gen_label_rtx ();
2515 if (! try_casesi (index_type, index_expr, minval, range,
2516 table_label, default_label))
2518 bool ok;
2520 /* Index jumptables from zero for suitable values of
2521 minval to avoid a subtraction. */
2522 if (! optimize_size
2523 && compare_tree_int (minval, 0) > 0
2524 && compare_tree_int (minval, 3) < 0)
2526 minval = build_int_cst (index_type, 0);
2527 range = maxval;
2530 ok = try_tablejump (index_type, index_expr, minval, range,
2531 table_label, default_label);
2532 gcc_assert (ok);
2535 /* Get table of labels to jump to, in order of case index. */
2537 ncases = tree_low_cst (range, 0) + 1;
2538 labelvec = alloca (ncases * sizeof (rtx));
2539 memset (labelvec, 0, ncases * sizeof (rtx));
2541 for (n = case_list; n; n = n->right)
2543 /* Compute the low and high bounds relative to the minimum
2544 value since that should fit in a HOST_WIDE_INT while the
2545 actual values may not. */
2546 HOST_WIDE_INT i_low
2547 = tree_low_cst (fold_build2 (MINUS_EXPR, index_type,
2548 n->low, minval), 1);
2549 HOST_WIDE_INT i_high
2550 = tree_low_cst (fold_build2 (MINUS_EXPR, index_type,
2551 n->high, minval), 1);
2552 HOST_WIDE_INT i;
2554 for (i = i_low; i <= i_high; i ++)
2555 labelvec[i]
2556 = gen_rtx_LABEL_REF (Pmode, label_rtx (n->code_label));
2559 /* Fill in the gaps with the default. */
2560 for (i = 0; i < ncases; i++)
2561 if (labelvec[i] == 0)
2562 labelvec[i] = gen_rtx_LABEL_REF (Pmode, default_label);
2564 /* Output the table. */
2565 emit_label (table_label);
2567 if (CASE_VECTOR_PC_RELATIVE || flag_pic)
2568 emit_jump_insn (gen_rtx_ADDR_DIFF_VEC (CASE_VECTOR_MODE,
2569 gen_rtx_LABEL_REF (Pmode, table_label),
2570 gen_rtvec_v (ncases, labelvec),
2571 const0_rtx, const0_rtx));
2572 else
2573 emit_jump_insn (gen_rtx_ADDR_VEC (CASE_VECTOR_MODE,
2574 gen_rtvec_v (ncases, labelvec)));
2576 /* Record no drop-through after the table. */
2577 emit_barrier ();
2580 before_case = NEXT_INSN (before_case);
2581 end = get_last_insn ();
2582 fail = squeeze_notes (&before_case, &end);
2583 gcc_assert (!fail);
2584 reorder_insns (before_case, end, start);
2587 free_temp_slots ();
2590 /* Generate code to jump to LABEL if OP1 and OP2 are equal. */
2592 static void
2593 do_jump_if_equal (rtx op1, rtx op2, rtx label, int unsignedp)
2595 if (GET_CODE (op1) == CONST_INT && GET_CODE (op2) == CONST_INT)
2597 if (op1 == op2)
2598 emit_jump (label);
2600 else
2601 emit_cmp_and_jump_insns (op1, op2, EQ, NULL_RTX,
2602 (GET_MODE (op1) == VOIDmode
2603 ? GET_MODE (op2) : GET_MODE (op1)),
2604 unsignedp, label);
2607 /* Not all case values are encountered equally. This function
2608 uses a heuristic to weight case labels, in cases where that
2609 looks like a reasonable thing to do.
2611 Right now, all we try to guess is text, and we establish the
2612 following weights:
2614 chars above space: 16
2615 digits: 16
2616 default: 12
2617 space, punct: 8
2618 tab: 4
2619 newline: 2
2620 other "\" chars: 1
2621 remaining chars: 0
2623 If we find any cases in the switch that are not either -1 or in the range
2624 of valid ASCII characters, or are control characters other than those
2625 commonly used with "\", don't treat this switch scanning text.
2627 Return 1 if these nodes are suitable for cost estimation, otherwise
2628 return 0. */
2630 static int
2631 estimate_case_costs (case_node_ptr node)
2633 tree min_ascii = integer_minus_one_node;
2634 tree max_ascii = build_int_cst (TREE_TYPE (node->high), 127);
2635 case_node_ptr n;
2636 int i;
2638 /* If we haven't already made the cost table, make it now. Note that the
2639 lower bound of the table is -1, not zero. */
2641 if (! cost_table_initialized)
2643 cost_table_initialized = 1;
2645 for (i = 0; i < 128; i++)
2647 if (ISALNUM (i))
2648 COST_TABLE (i) = 16;
2649 else if (ISPUNCT (i))
2650 COST_TABLE (i) = 8;
2651 else if (ISCNTRL (i))
2652 COST_TABLE (i) = -1;
2655 COST_TABLE (' ') = 8;
2656 COST_TABLE ('\t') = 4;
2657 COST_TABLE ('\0') = 4;
2658 COST_TABLE ('\n') = 2;
2659 COST_TABLE ('\f') = 1;
2660 COST_TABLE ('\v') = 1;
2661 COST_TABLE ('\b') = 1;
2664 /* See if all the case expressions look like text. It is text if the
2665 constant is >= -1 and the highest constant is <= 127. Do all comparisons
2666 as signed arithmetic since we don't want to ever access cost_table with a
2667 value less than -1. Also check that none of the constants in a range
2668 are strange control characters. */
2670 for (n = node; n; n = n->right)
2672 if ((INT_CST_LT (n->low, min_ascii)) || INT_CST_LT (max_ascii, n->high))
2673 return 0;
2675 for (i = (HOST_WIDE_INT) TREE_INT_CST_LOW (n->low);
2676 i <= (HOST_WIDE_INT) TREE_INT_CST_LOW (n->high); i++)
2677 if (COST_TABLE (i) < 0)
2678 return 0;
2681 /* All interesting values are within the range of interesting
2682 ASCII characters. */
2683 return 1;
2686 /* Take an ordered list of case nodes
2687 and transform them into a near optimal binary tree,
2688 on the assumption that any target code selection value is as
2689 likely as any other.
2691 The transformation is performed by splitting the ordered
2692 list into two equal sections plus a pivot. The parts are
2693 then attached to the pivot as left and right branches. Each
2694 branch is then transformed recursively. */
2696 static void
2697 balance_case_nodes (case_node_ptr *head, case_node_ptr parent)
2699 case_node_ptr np;
2701 np = *head;
2702 if (np)
2704 int cost = 0;
2705 int i = 0;
2706 int ranges = 0;
2707 case_node_ptr *npp;
2708 case_node_ptr left;
2710 /* Count the number of entries on branch. Also count the ranges. */
2712 while (np)
2714 if (!tree_int_cst_equal (np->low, np->high))
2716 ranges++;
2717 if (use_cost_table)
2718 cost += COST_TABLE (TREE_INT_CST_LOW (np->high));
2721 if (use_cost_table)
2722 cost += COST_TABLE (TREE_INT_CST_LOW (np->low));
2724 i++;
2725 np = np->right;
2728 if (i > 2)
2730 /* Split this list if it is long enough for that to help. */
2731 npp = head;
2732 left = *npp;
2733 if (use_cost_table)
2735 /* Find the place in the list that bisects the list's total cost,
2736 Here I gets half the total cost. */
2737 int n_moved = 0;
2738 i = (cost + 1) / 2;
2739 while (1)
2741 /* Skip nodes while their cost does not reach that amount. */
2742 if (!tree_int_cst_equal ((*npp)->low, (*npp)->high))
2743 i -= COST_TABLE (TREE_INT_CST_LOW ((*npp)->high));
2744 i -= COST_TABLE (TREE_INT_CST_LOW ((*npp)->low));
2745 if (i <= 0)
2746 break;
2747 npp = &(*npp)->right;
2748 n_moved += 1;
2750 if (n_moved == 0)
2752 /* Leave this branch lopsided, but optimize left-hand
2753 side and fill in `parent' fields for right-hand side. */
2754 np = *head;
2755 np->parent = parent;
2756 balance_case_nodes (&np->left, np);
2757 for (; np->right; np = np->right)
2758 np->right->parent = np;
2759 return;
2762 /* If there are just three nodes, split at the middle one. */
2763 else if (i == 3)
2764 npp = &(*npp)->right;
2765 else
2767 /* Find the place in the list that bisects the list's total cost,
2768 where ranges count as 2.
2769 Here I gets half the total cost. */
2770 i = (i + ranges + 1) / 2;
2771 while (1)
2773 /* Skip nodes while their cost does not reach that amount. */
2774 if (!tree_int_cst_equal ((*npp)->low, (*npp)->high))
2775 i--;
2776 i--;
2777 if (i <= 0)
2778 break;
2779 npp = &(*npp)->right;
2782 *head = np = *npp;
2783 *npp = 0;
2784 np->parent = parent;
2785 np->left = left;
2787 /* Optimize each of the two split parts. */
2788 balance_case_nodes (&np->left, np);
2789 balance_case_nodes (&np->right, np);
2791 else
2793 /* Else leave this branch as one level,
2794 but fill in `parent' fields. */
2795 np = *head;
2796 np->parent = parent;
2797 for (; np->right; np = np->right)
2798 np->right->parent = np;
2803 /* Search the parent sections of the case node tree
2804 to see if a test for the lower bound of NODE would be redundant.
2805 INDEX_TYPE is the type of the index expression.
2807 The instructions to generate the case decision tree are
2808 output in the same order as nodes are processed so it is
2809 known that if a parent node checks the range of the current
2810 node minus one that the current node is bounded at its lower
2811 span. Thus the test would be redundant. */
2813 static int
2814 node_has_low_bound (case_node_ptr node, tree index_type)
2816 tree low_minus_one;
2817 case_node_ptr pnode;
2819 /* If the lower bound of this node is the lowest value in the index type,
2820 we need not test it. */
2822 if (tree_int_cst_equal (node->low, TYPE_MIN_VALUE (index_type)))
2823 return 1;
2825 /* If this node has a left branch, the value at the left must be less
2826 than that at this node, so it cannot be bounded at the bottom and
2827 we need not bother testing any further. */
2829 if (node->left)
2830 return 0;
2832 low_minus_one = fold_build2 (MINUS_EXPR, TREE_TYPE (node->low),
2833 node->low,
2834 build_int_cst (TREE_TYPE (node->low), 1));
2836 /* If the subtraction above overflowed, we can't verify anything.
2837 Otherwise, look for a parent that tests our value - 1. */
2839 if (! tree_int_cst_lt (low_minus_one, node->low))
2840 return 0;
2842 for (pnode = node->parent; pnode; pnode = pnode->parent)
2843 if (tree_int_cst_equal (low_minus_one, pnode->high))
2844 return 1;
2846 return 0;
2849 /* Search the parent sections of the case node tree
2850 to see if a test for the upper bound of NODE would be redundant.
2851 INDEX_TYPE is the type of the index expression.
2853 The instructions to generate the case decision tree are
2854 output in the same order as nodes are processed so it is
2855 known that if a parent node checks the range of the current
2856 node plus one that the current node is bounded at its upper
2857 span. Thus the test would be redundant. */
2859 static int
2860 node_has_high_bound (case_node_ptr node, tree index_type)
2862 tree high_plus_one;
2863 case_node_ptr pnode;
2865 /* If there is no upper bound, obviously no test is needed. */
2867 if (TYPE_MAX_VALUE (index_type) == NULL)
2868 return 1;
2870 /* If the upper bound of this node is the highest value in the type
2871 of the index expression, we need not test against it. */
2873 if (tree_int_cst_equal (node->high, TYPE_MAX_VALUE (index_type)))
2874 return 1;
2876 /* If this node has a right branch, the value at the right must be greater
2877 than that at this node, so it cannot be bounded at the top and
2878 we need not bother testing any further. */
2880 if (node->right)
2881 return 0;
2883 high_plus_one = fold_build2 (PLUS_EXPR, TREE_TYPE (node->high),
2884 node->high,
2885 build_int_cst (TREE_TYPE (node->high), 1));
2887 /* If the addition above overflowed, we can't verify anything.
2888 Otherwise, look for a parent that tests our value + 1. */
2890 if (! tree_int_cst_lt (node->high, high_plus_one))
2891 return 0;
2893 for (pnode = node->parent; pnode; pnode = pnode->parent)
2894 if (tree_int_cst_equal (high_plus_one, pnode->low))
2895 return 1;
2897 return 0;
2900 /* Search the parent sections of the
2901 case node tree to see if both tests for the upper and lower
2902 bounds of NODE would be redundant. */
2904 static int
2905 node_is_bounded (case_node_ptr node, tree index_type)
2907 return (node_has_low_bound (node, index_type)
2908 && node_has_high_bound (node, index_type));
2911 /* Emit step-by-step code to select a case for the value of INDEX.
2912 The thus generated decision tree follows the form of the
2913 case-node binary tree NODE, whose nodes represent test conditions.
2914 INDEX_TYPE is the type of the index of the switch.
2916 Care is taken to prune redundant tests from the decision tree
2917 by detecting any boundary conditions already checked by
2918 emitted rtx. (See node_has_high_bound, node_has_low_bound
2919 and node_is_bounded, above.)
2921 Where the test conditions can be shown to be redundant we emit
2922 an unconditional jump to the target code. As a further
2923 optimization, the subordinates of a tree node are examined to
2924 check for bounded nodes. In this case conditional and/or
2925 unconditional jumps as a result of the boundary check for the
2926 current node are arranged to target the subordinates associated
2927 code for out of bound conditions on the current node.
2929 We can assume that when control reaches the code generated here,
2930 the index value has already been compared with the parents
2931 of this node, and determined to be on the same side of each parent
2932 as this node is. Thus, if this node tests for the value 51,
2933 and a parent tested for 52, we don't need to consider
2934 the possibility of a value greater than 51. If another parent
2935 tests for the value 50, then this node need not test anything. */
2937 static void
2938 emit_case_nodes (rtx index, case_node_ptr node, rtx default_label,
2939 tree index_type)
2941 /* If INDEX has an unsigned type, we must make unsigned branches. */
2942 int unsignedp = TYPE_UNSIGNED (index_type);
2943 enum machine_mode mode = GET_MODE (index);
2944 enum machine_mode imode = TYPE_MODE (index_type);
2946 /* See if our parents have already tested everything for us.
2947 If they have, emit an unconditional jump for this node. */
2948 if (node_is_bounded (node, index_type))
2949 emit_jump (label_rtx (node->code_label));
2951 else if (tree_int_cst_equal (node->low, node->high))
2953 /* Node is single valued. First see if the index expression matches
2954 this node and then check our children, if any. */
2956 do_jump_if_equal (index,
2957 convert_modes (mode, imode,
2958 expand_expr (node->low, NULL_RTX,
2959 VOIDmode, 0),
2960 unsignedp),
2961 label_rtx (node->code_label), unsignedp);
2963 if (node->right != 0 && node->left != 0)
2965 /* This node has children on both sides.
2966 Dispatch to one side or the other
2967 by comparing the index value with this node's value.
2968 If one subtree is bounded, check that one first,
2969 so we can avoid real branches in the tree. */
2971 if (node_is_bounded (node->right, index_type))
2973 emit_cmp_and_jump_insns (index,
2974 convert_modes
2975 (mode, imode,
2976 expand_expr (node->high, NULL_RTX,
2977 VOIDmode, 0),
2978 unsignedp),
2979 GT, NULL_RTX, mode, unsignedp,
2980 label_rtx (node->right->code_label));
2981 emit_case_nodes (index, node->left, default_label, index_type);
2984 else if (node_is_bounded (node->left, index_type))
2986 emit_cmp_and_jump_insns (index,
2987 convert_modes
2988 (mode, imode,
2989 expand_expr (node->high, NULL_RTX,
2990 VOIDmode, 0),
2991 unsignedp),
2992 LT, NULL_RTX, mode, unsignedp,
2993 label_rtx (node->left->code_label));
2994 emit_case_nodes (index, node->right, default_label, index_type);
2997 /* If both children are single-valued cases with no
2998 children, finish up all the work. This way, we can save
2999 one ordered comparison. */
3000 else if (tree_int_cst_equal (node->right->low, node->right->high)
3001 && node->right->left == 0
3002 && node->right->right == 0
3003 && tree_int_cst_equal (node->left->low, node->left->high)
3004 && node->left->left == 0
3005 && node->left->right == 0)
3007 /* Neither node is bounded. First distinguish the two sides;
3008 then emit the code for one side at a time. */
3010 /* See if the value matches what the right hand side
3011 wants. */
3012 do_jump_if_equal (index,
3013 convert_modes (mode, imode,
3014 expand_expr (node->right->low,
3015 NULL_RTX,
3016 VOIDmode, 0),
3017 unsignedp),
3018 label_rtx (node->right->code_label),
3019 unsignedp);
3021 /* See if the value matches what the left hand side
3022 wants. */
3023 do_jump_if_equal (index,
3024 convert_modes (mode, imode,
3025 expand_expr (node->left->low,
3026 NULL_RTX,
3027 VOIDmode, 0),
3028 unsignedp),
3029 label_rtx (node->left->code_label),
3030 unsignedp);
3033 else
3035 /* Neither node is bounded. First distinguish the two sides;
3036 then emit the code for one side at a time. */
3038 tree test_label = build_decl (LABEL_DECL, NULL_TREE, NULL_TREE);
3040 /* See if the value is on the right. */
3041 emit_cmp_and_jump_insns (index,
3042 convert_modes
3043 (mode, imode,
3044 expand_expr (node->high, NULL_RTX,
3045 VOIDmode, 0),
3046 unsignedp),
3047 GT, NULL_RTX, mode, unsignedp,
3048 label_rtx (test_label));
3050 /* Value must be on the left.
3051 Handle the left-hand subtree. */
3052 emit_case_nodes (index, node->left, default_label, index_type);
3053 /* If left-hand subtree does nothing,
3054 go to default. */
3055 emit_jump (default_label);
3057 /* Code branches here for the right-hand subtree. */
3058 expand_label (test_label);
3059 emit_case_nodes (index, node->right, default_label, index_type);
3063 else if (node->right != 0 && node->left == 0)
3065 /* Here we have a right child but no left so we issue a conditional
3066 branch to default and process the right child.
3068 Omit the conditional branch to default if the right child
3069 does not have any children and is single valued; it would
3070 cost too much space to save so little time. */
3072 if (node->right->right || node->right->left
3073 || !tree_int_cst_equal (node->right->low, node->right->high))
3075 if (!node_has_low_bound (node, index_type))
3077 emit_cmp_and_jump_insns (index,
3078 convert_modes
3079 (mode, imode,
3080 expand_expr (node->high, NULL_RTX,
3081 VOIDmode, 0),
3082 unsignedp),
3083 LT, NULL_RTX, mode, unsignedp,
3084 default_label);
3087 emit_case_nodes (index, node->right, default_label, index_type);
3089 else
3090 /* We cannot process node->right normally
3091 since we haven't ruled out the numbers less than
3092 this node's value. So handle node->right explicitly. */
3093 do_jump_if_equal (index,
3094 convert_modes
3095 (mode, imode,
3096 expand_expr (node->right->low, NULL_RTX,
3097 VOIDmode, 0),
3098 unsignedp),
3099 label_rtx (node->right->code_label), unsignedp);
3102 else if (node->right == 0 && node->left != 0)
3104 /* Just one subtree, on the left. */
3105 if (node->left->left || node->left->right
3106 || !tree_int_cst_equal (node->left->low, node->left->high))
3108 if (!node_has_high_bound (node, index_type))
3110 emit_cmp_and_jump_insns (index,
3111 convert_modes
3112 (mode, imode,
3113 expand_expr (node->high, NULL_RTX,
3114 VOIDmode, 0),
3115 unsignedp),
3116 GT, NULL_RTX, mode, unsignedp,
3117 default_label);
3120 emit_case_nodes (index, node->left, default_label, index_type);
3122 else
3123 /* We cannot process node->left normally
3124 since we haven't ruled out the numbers less than
3125 this node's value. So handle node->left explicitly. */
3126 do_jump_if_equal (index,
3127 convert_modes
3128 (mode, imode,
3129 expand_expr (node->left->low, NULL_RTX,
3130 VOIDmode, 0),
3131 unsignedp),
3132 label_rtx (node->left->code_label), unsignedp);
3135 else
3137 /* Node is a range. These cases are very similar to those for a single
3138 value, except that we do not start by testing whether this node
3139 is the one to branch to. */
3141 if (node->right != 0 && node->left != 0)
3143 /* Node has subtrees on both sides.
3144 If the right-hand subtree is bounded,
3145 test for it first, since we can go straight there.
3146 Otherwise, we need to make a branch in the control structure,
3147 then handle the two subtrees. */
3148 tree test_label = 0;
3150 if (node_is_bounded (node->right, index_type))
3151 /* Right hand node is fully bounded so we can eliminate any
3152 testing and branch directly to the target code. */
3153 emit_cmp_and_jump_insns (index,
3154 convert_modes
3155 (mode, imode,
3156 expand_expr (node->high, NULL_RTX,
3157 VOIDmode, 0),
3158 unsignedp),
3159 GT, NULL_RTX, mode, unsignedp,
3160 label_rtx (node->right->code_label));
3161 else
3163 /* Right hand node requires testing.
3164 Branch to a label where we will handle it later. */
3166 test_label = build_decl (LABEL_DECL, NULL_TREE, NULL_TREE);
3167 emit_cmp_and_jump_insns (index,
3168 convert_modes
3169 (mode, imode,
3170 expand_expr (node->high, NULL_RTX,
3171 VOIDmode, 0),
3172 unsignedp),
3173 GT, NULL_RTX, mode, unsignedp,
3174 label_rtx (test_label));
3177 /* Value belongs to this node or to the left-hand subtree. */
3179 emit_cmp_and_jump_insns (index,
3180 convert_modes
3181 (mode, imode,
3182 expand_expr (node->low, NULL_RTX,
3183 VOIDmode, 0),
3184 unsignedp),
3185 GE, NULL_RTX, mode, unsignedp,
3186 label_rtx (node->code_label));
3188 /* Handle the left-hand subtree. */
3189 emit_case_nodes (index, node->left, default_label, index_type);
3191 /* If right node had to be handled later, do that now. */
3193 if (test_label)
3195 /* If the left-hand subtree fell through,
3196 don't let it fall into the right-hand subtree. */
3197 emit_jump (default_label);
3199 expand_label (test_label);
3200 emit_case_nodes (index, node->right, default_label, index_type);
3204 else if (node->right != 0 && node->left == 0)
3206 /* Deal with values to the left of this node,
3207 if they are possible. */
3208 if (!node_has_low_bound (node, index_type))
3210 emit_cmp_and_jump_insns (index,
3211 convert_modes
3212 (mode, imode,
3213 expand_expr (node->low, NULL_RTX,
3214 VOIDmode, 0),
3215 unsignedp),
3216 LT, NULL_RTX, mode, unsignedp,
3217 default_label);
3220 /* Value belongs to this node or to the right-hand subtree. */
3222 emit_cmp_and_jump_insns (index,
3223 convert_modes
3224 (mode, imode,
3225 expand_expr (node->high, NULL_RTX,
3226 VOIDmode, 0),
3227 unsignedp),
3228 LE, NULL_RTX, mode, unsignedp,
3229 label_rtx (node->code_label));
3231 emit_case_nodes (index, node->right, default_label, index_type);
3234 else if (node->right == 0 && node->left != 0)
3236 /* Deal with values to the right of this node,
3237 if they are possible. */
3238 if (!node_has_high_bound (node, index_type))
3240 emit_cmp_and_jump_insns (index,
3241 convert_modes
3242 (mode, imode,
3243 expand_expr (node->high, NULL_RTX,
3244 VOIDmode, 0),
3245 unsignedp),
3246 GT, NULL_RTX, mode, unsignedp,
3247 default_label);
3250 /* Value belongs to this node or to the left-hand subtree. */
3252 emit_cmp_and_jump_insns (index,
3253 convert_modes
3254 (mode, imode,
3255 expand_expr (node->low, NULL_RTX,
3256 VOIDmode, 0),
3257 unsignedp),
3258 GE, NULL_RTX, mode, unsignedp,
3259 label_rtx (node->code_label));
3261 emit_case_nodes (index, node->left, default_label, index_type);
3264 else
3266 /* Node has no children so we check low and high bounds to remove
3267 redundant tests. Only one of the bounds can exist,
3268 since otherwise this node is bounded--a case tested already. */
3269 int high_bound = node_has_high_bound (node, index_type);
3270 int low_bound = node_has_low_bound (node, index_type);
3272 if (!high_bound && low_bound)
3274 emit_cmp_and_jump_insns (index,
3275 convert_modes
3276 (mode, imode,
3277 expand_expr (node->high, NULL_RTX,
3278 VOIDmode, 0),
3279 unsignedp),
3280 GT, NULL_RTX, mode, unsignedp,
3281 default_label);
3284 else if (!low_bound && high_bound)
3286 emit_cmp_and_jump_insns (index,
3287 convert_modes
3288 (mode, imode,
3289 expand_expr (node->low, NULL_RTX,
3290 VOIDmode, 0),
3291 unsignedp),
3292 LT, NULL_RTX, mode, unsignedp,
3293 default_label);
3295 else if (!low_bound && !high_bound)
3297 /* Widen LOW and HIGH to the same width as INDEX. */
3298 tree type = lang_hooks.types.type_for_mode (mode, unsignedp);
3299 tree low = build1 (CONVERT_EXPR, type, node->low);
3300 tree high = build1 (CONVERT_EXPR, type, node->high);
3301 rtx low_rtx, new_index, new_bound;
3303 /* Instead of doing two branches, emit one unsigned branch for
3304 (index-low) > (high-low). */
3305 low_rtx = expand_expr (low, NULL_RTX, mode, 0);
3306 new_index = expand_simple_binop (mode, MINUS, index, low_rtx,
3307 NULL_RTX, unsignedp,
3308 OPTAB_WIDEN);
3309 new_bound = expand_expr (fold_build2 (MINUS_EXPR, type,
3310 high, low),
3311 NULL_RTX, mode, 0);
3313 emit_cmp_and_jump_insns (new_index, new_bound, GT, NULL_RTX,
3314 mode, 1, default_label);
3317 emit_jump (label_rtx (node->code_label));