* config/xtensa/xtensa.c (function_arg_boundary): New.
[official-gcc.git] / gcc / config / xtensa / xtensa.c
blob836ae2e1687a70e9c92068c7446e376e5e879e56
1 /* Subroutines for insn-output.c for Tensilica's Xtensa architecture.
2 Copyright 2001, 2002, 2003, 2004, 2005, 2006 Free Software Foundation, Inc.
3 Contributed by Bob Wilson (bwilson@tensilica.com) at Tensilica.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 2, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING. If not, write to the Free
19 Software Foundation, 51 Franklin Street, Fifth Floor, Boston, MA
20 02110-1301, USA. */
22 #include "config.h"
23 #include "system.h"
24 #include "coretypes.h"
25 #include "tm.h"
26 #include "rtl.h"
27 #include "regs.h"
28 #include "hard-reg-set.h"
29 #include "basic-block.h"
30 #include "real.h"
31 #include "insn-config.h"
32 #include "conditions.h"
33 #include "insn-flags.h"
34 #include "insn-attr.h"
35 #include "insn-codes.h"
36 #include "recog.h"
37 #include "output.h"
38 #include "tree.h"
39 #include "expr.h"
40 #include "flags.h"
41 #include "reload.h"
42 #include "tm_p.h"
43 #include "function.h"
44 #include "toplev.h"
45 #include "optabs.h"
46 #include "libfuncs.h"
47 #include "ggc.h"
48 #include "target.h"
49 #include "target-def.h"
50 #include "langhooks.h"
51 #include "tree-gimple.h"
54 /* Enumeration for all of the relational tests, so that we can build
55 arrays indexed by the test type, and not worry about the order
56 of EQ, NE, etc. */
58 enum internal_test
60 ITEST_EQ,
61 ITEST_NE,
62 ITEST_GT,
63 ITEST_GE,
64 ITEST_LT,
65 ITEST_LE,
66 ITEST_GTU,
67 ITEST_GEU,
68 ITEST_LTU,
69 ITEST_LEU,
70 ITEST_MAX
73 /* Cached operands, and operator to compare for use in set/branch on
74 condition codes. */
75 rtx branch_cmp[2];
77 /* what type of branch to use */
78 enum cmp_type branch_type;
80 /* Array giving truth value on whether or not a given hard register
81 can support a given mode. */
82 char xtensa_hard_regno_mode_ok[(int) MAX_MACHINE_MODE][FIRST_PSEUDO_REGISTER];
84 /* Current frame size calculated by compute_frame_size. */
85 unsigned xtensa_current_frame_size;
87 /* Largest block move to handle in-line. */
88 #define LARGEST_MOVE_RATIO 15
90 /* Define the structure for the machine field in struct function. */
91 struct machine_function GTY(())
93 int accesses_prev_frame;
94 bool need_a7_copy;
95 bool vararg_a7;
96 rtx set_frame_ptr_insn;
99 /* Vector, indexed by hard register number, which contains 1 for a
100 register that is allowable in a candidate for leaf function
101 treatment. */
103 const char xtensa_leaf_regs[FIRST_PSEUDO_REGISTER] =
105 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
106 1, 1, 1,
107 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
111 /* Map hard register number to register class */
112 const enum reg_class xtensa_regno_to_class[FIRST_PSEUDO_REGISTER] =
114 RL_REGS, SP_REG, RL_REGS, RL_REGS,
115 RL_REGS, RL_REGS, RL_REGS, GR_REGS,
116 RL_REGS, RL_REGS, RL_REGS, RL_REGS,
117 RL_REGS, RL_REGS, RL_REGS, RL_REGS,
118 AR_REGS, AR_REGS, BR_REGS,
119 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
120 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
121 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
122 FP_REGS, FP_REGS, FP_REGS, FP_REGS,
123 ACC_REG,
126 /* Map register constraint character to register class. */
127 enum reg_class xtensa_char_to_class[256] =
129 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
130 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
131 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
132 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
133 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
134 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
135 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
136 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
137 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
138 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
139 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
140 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
141 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
142 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
143 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
144 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
145 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
146 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
147 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
148 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
149 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
150 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
151 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
152 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
153 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
154 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
155 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
156 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
157 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
158 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
159 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
160 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
161 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
162 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
163 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
164 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
165 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
166 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
167 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
168 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
169 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
170 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
171 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
172 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
173 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
174 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
175 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
176 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
177 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
178 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
179 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
180 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
181 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
182 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
183 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
184 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
185 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
186 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
187 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
188 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
189 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
190 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
191 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
192 NO_REGS, NO_REGS, NO_REGS, NO_REGS,
195 static enum internal_test map_test_to_internal_test (enum rtx_code);
196 static rtx gen_int_relational (enum rtx_code, rtx, rtx, int *);
197 static rtx gen_float_relational (enum rtx_code, rtx, rtx);
198 static rtx gen_conditional_move (rtx);
199 static rtx fixup_subreg_mem (rtx);
200 static struct machine_function * xtensa_init_machine_status (void);
201 static bool xtensa_return_in_msb (tree);
202 static void printx (FILE *, signed int);
203 static void xtensa_function_epilogue (FILE *, HOST_WIDE_INT);
204 static rtx xtensa_builtin_saveregs (void);
205 static unsigned int xtensa_multibss_section_type_flags (tree, const char *,
206 int) ATTRIBUTE_UNUSED;
207 static section *xtensa_select_rtx_section (enum machine_mode, rtx,
208 unsigned HOST_WIDE_INT);
209 static bool xtensa_rtx_costs (rtx, int, int, int *);
210 static tree xtensa_build_builtin_va_list (void);
211 static bool xtensa_return_in_memory (tree, tree);
212 static tree xtensa_gimplify_va_arg_expr (tree, tree, tree *, tree *);
214 static const int reg_nonleaf_alloc_order[FIRST_PSEUDO_REGISTER] =
215 REG_ALLOC_ORDER;
218 /* This macro generates the assembly code for function exit,
219 on machines that need it. If FUNCTION_EPILOGUE is not defined
220 then individual return instructions are generated for each
221 return statement. Args are same as for FUNCTION_PROLOGUE. */
223 #undef TARGET_ASM_FUNCTION_EPILOGUE
224 #define TARGET_ASM_FUNCTION_EPILOGUE xtensa_function_epilogue
226 /* These hooks specify assembly directives for creating certain kinds
227 of integer object. */
229 #undef TARGET_ASM_ALIGNED_SI_OP
230 #define TARGET_ASM_ALIGNED_SI_OP "\t.word\t"
232 #undef TARGET_ASM_SELECT_RTX_SECTION
233 #define TARGET_ASM_SELECT_RTX_SECTION xtensa_select_rtx_section
235 #undef TARGET_DEFAULT_TARGET_FLAGS
236 #define TARGET_DEFAULT_TARGET_FLAGS (TARGET_DEFAULT | MASK_FUSED_MADD)
238 #undef TARGET_RTX_COSTS
239 #define TARGET_RTX_COSTS xtensa_rtx_costs
240 #undef TARGET_ADDRESS_COST
241 #define TARGET_ADDRESS_COST hook_int_rtx_0
243 #undef TARGET_BUILD_BUILTIN_VA_LIST
244 #define TARGET_BUILD_BUILTIN_VA_LIST xtensa_build_builtin_va_list
246 #undef TARGET_PROMOTE_FUNCTION_ARGS
247 #define TARGET_PROMOTE_FUNCTION_ARGS hook_bool_tree_true
248 #undef TARGET_PROMOTE_FUNCTION_RETURN
249 #define TARGET_PROMOTE_FUNCTION_RETURN hook_bool_tree_true
250 #undef TARGET_PROMOTE_PROTOTYPES
251 #define TARGET_PROMOTE_PROTOTYPES hook_bool_tree_true
253 #undef TARGET_RETURN_IN_MEMORY
254 #define TARGET_RETURN_IN_MEMORY xtensa_return_in_memory
255 #undef TARGET_SPLIT_COMPLEX_ARG
256 #define TARGET_SPLIT_COMPLEX_ARG hook_bool_tree_true
257 #undef TARGET_MUST_PASS_IN_STACK
258 #define TARGET_MUST_PASS_IN_STACK must_pass_in_stack_var_size
260 #undef TARGET_EXPAND_BUILTIN_SAVEREGS
261 #define TARGET_EXPAND_BUILTIN_SAVEREGS xtensa_builtin_saveregs
262 #undef TARGET_GIMPLIFY_VA_ARG_EXPR
263 #define TARGET_GIMPLIFY_VA_ARG_EXPR xtensa_gimplify_va_arg_expr
265 #undef TARGET_RETURN_IN_MSB
266 #define TARGET_RETURN_IN_MSB xtensa_return_in_msb
268 struct gcc_target targetm = TARGET_INITIALIZER;
272 * Functions to test Xtensa immediate operand validity.
275 bool
276 xtensa_simm8 (HOST_WIDE_INT v)
278 return v >= -128 && v <= 127;
282 bool
283 xtensa_simm8x256 (HOST_WIDE_INT v)
285 return (v & 255) == 0 && (v >= -32768 && v <= 32512);
289 bool
290 xtensa_simm12b (HOST_WIDE_INT v)
292 return v >= -2048 && v <= 2047;
296 static bool
297 xtensa_uimm8 (HOST_WIDE_INT v)
299 return v >= 0 && v <= 255;
303 static bool
304 xtensa_uimm8x2 (HOST_WIDE_INT v)
306 return (v & 1) == 0 && (v >= 0 && v <= 510);
310 static bool
311 xtensa_uimm8x4 (HOST_WIDE_INT v)
313 return (v & 3) == 0 && (v >= 0 && v <= 1020);
317 static bool
318 xtensa_b4const (HOST_WIDE_INT v)
320 switch (v)
322 case -1:
323 case 1:
324 case 2:
325 case 3:
326 case 4:
327 case 5:
328 case 6:
329 case 7:
330 case 8:
331 case 10:
332 case 12:
333 case 16:
334 case 32:
335 case 64:
336 case 128:
337 case 256:
338 return true;
340 return false;
344 bool
345 xtensa_b4const_or_zero (HOST_WIDE_INT v)
347 if (v == 0)
348 return true;
349 return xtensa_b4const (v);
353 bool
354 xtensa_b4constu (HOST_WIDE_INT v)
356 switch (v)
358 case 32768:
359 case 65536:
360 case 2:
361 case 3:
362 case 4:
363 case 5:
364 case 6:
365 case 7:
366 case 8:
367 case 10:
368 case 12:
369 case 16:
370 case 32:
371 case 64:
372 case 128:
373 case 256:
374 return true;
376 return false;
380 bool
381 xtensa_mask_immediate (HOST_WIDE_INT v)
383 #define MAX_MASK_SIZE 16
384 int mask_size;
386 for (mask_size = 1; mask_size <= MAX_MASK_SIZE; mask_size++)
388 if ((v & 1) == 0)
389 return false;
390 v = v >> 1;
391 if (v == 0)
392 return true;
395 return false;
399 bool
400 xtensa_const_ok_for_letter_p (HOST_WIDE_INT v, int c)
402 switch (c)
404 case 'I': return xtensa_simm12b (v);
405 case 'J': return xtensa_simm8 (v);
406 case 'K': return (v == 0 || xtensa_b4const (v));
407 case 'L': return xtensa_b4constu (v);
408 case 'M': return (v >= -32 && v <= 95);
409 case 'N': return xtensa_simm8x256 (v);
410 case 'O': return (v == -1 || (v >= 1 && v <= 15));
411 case 'P': return xtensa_mask_immediate (v);
412 default: break;
414 return false;
418 /* This is just like the standard true_regnum() function except that it
419 works even when reg_renumber is not initialized. */
422 xt_true_regnum (rtx x)
424 if (GET_CODE (x) == REG)
426 if (reg_renumber
427 && REGNO (x) >= FIRST_PSEUDO_REGISTER
428 && reg_renumber[REGNO (x)] >= 0)
429 return reg_renumber[REGNO (x)];
430 return REGNO (x);
432 if (GET_CODE (x) == SUBREG)
434 int base = xt_true_regnum (SUBREG_REG (x));
435 if (base >= 0 && base < FIRST_PSEUDO_REGISTER)
436 return base + subreg_regno_offset (REGNO (SUBREG_REG (x)),
437 GET_MODE (SUBREG_REG (x)),
438 SUBREG_BYTE (x), GET_MODE (x));
440 return -1;
445 xtensa_valid_move (enum machine_mode mode, rtx *operands)
447 /* Either the destination or source must be a register, and the
448 MAC16 accumulator doesn't count. */
450 if (register_operand (operands[0], mode))
452 int dst_regnum = xt_true_regnum (operands[0]);
454 /* The stack pointer can only be assigned with a MOVSP opcode. */
455 if (dst_regnum == STACK_POINTER_REGNUM)
456 return (mode == SImode
457 && register_operand (operands[1], mode)
458 && !ACC_REG_P (xt_true_regnum (operands[1])));
460 if (!ACC_REG_P (dst_regnum))
461 return true;
463 if (register_operand (operands[1], mode))
465 int src_regnum = xt_true_regnum (operands[1]);
466 if (!ACC_REG_P (src_regnum))
467 return true;
469 return FALSE;
474 smalloffset_mem_p (rtx op)
476 if (GET_CODE (op) == MEM)
478 rtx addr = XEXP (op, 0);
479 if (GET_CODE (addr) == REG)
480 return REG_OK_FOR_BASE_P (addr);
481 if (GET_CODE (addr) == PLUS)
483 rtx offset = XEXP (addr, 0);
484 HOST_WIDE_INT val;
485 if (GET_CODE (offset) != CONST_INT)
486 offset = XEXP (addr, 1);
487 if (GET_CODE (offset) != CONST_INT)
488 return FALSE;
490 val = INTVAL (offset);
491 return (val & 3) == 0 && (val >= 0 && val <= 60);
494 return FALSE;
499 constantpool_address_p (rtx addr)
501 rtx sym = addr;
503 if (GET_CODE (addr) == CONST)
505 rtx offset;
507 /* Only handle (PLUS (SYM, OFFSET)) form. */
508 addr = XEXP (addr, 0);
509 if (GET_CODE (addr) != PLUS)
510 return FALSE;
512 /* Make sure the address is word aligned. */
513 offset = XEXP (addr, 1);
514 if ((GET_CODE (offset) != CONST_INT)
515 || ((INTVAL (offset) & 3) != 0))
516 return FALSE;
518 sym = XEXP (addr, 0);
521 if ((GET_CODE (sym) == SYMBOL_REF)
522 && CONSTANT_POOL_ADDRESS_P (sym))
523 return TRUE;
524 return FALSE;
529 constantpool_mem_p (rtx op)
531 if (GET_CODE (op) == MEM)
532 return constantpool_address_p (XEXP (op, 0));
533 return FALSE;
537 void
538 xtensa_extend_reg (rtx dst, rtx src)
540 rtx temp = gen_reg_rtx (SImode);
541 rtx shift = GEN_INT (BITS_PER_WORD - GET_MODE_BITSIZE (GET_MODE (src)));
543 /* Generate paradoxical subregs as needed so that the modes match. */
544 src = simplify_gen_subreg (SImode, src, GET_MODE (src), 0);
545 dst = simplify_gen_subreg (SImode, dst, GET_MODE (dst), 0);
547 emit_insn (gen_ashlsi3 (temp, src, shift));
548 emit_insn (gen_ashrsi3 (dst, temp, shift));
552 bool
553 xtensa_mem_offset (unsigned v, enum machine_mode mode)
555 switch (mode)
557 case BLKmode:
558 /* Handle the worst case for block moves. See xtensa_expand_block_move
559 where we emit an optimized block move operation if the block can be
560 moved in < "move_ratio" pieces. The worst case is when the block is
561 aligned but has a size of (3 mod 4) (does this happen?) so that the
562 last piece requires a byte load/store. */
563 return (xtensa_uimm8 (v)
564 && xtensa_uimm8 (v + MOVE_MAX * LARGEST_MOVE_RATIO));
566 case QImode:
567 return xtensa_uimm8 (v);
569 case HImode:
570 return xtensa_uimm8x2 (v);
572 case DFmode:
573 return (xtensa_uimm8x4 (v) && xtensa_uimm8x4 (v + 4));
575 default:
576 break;
579 return xtensa_uimm8x4 (v);
583 bool
584 xtensa_extra_constraint (rtx op, int c)
586 /* Allow pseudo registers during reload. */
587 if (GET_CODE (op) != MEM)
588 return (c >= 'R' && c <= 'U'
589 && reload_in_progress && GET_CODE (op) == REG
590 && REGNO (op) >= FIRST_PSEUDO_REGISTER);
592 switch (c)
594 case 'R': return smalloffset_mem_p (op);
595 case 'T': return !TARGET_CONST16 && constantpool_mem_p (op);
596 case 'U': return !constantpool_mem_p (op);
597 default: break;
599 return false;
603 /* Make normal rtx_code into something we can index from an array. */
605 static enum internal_test
606 map_test_to_internal_test (enum rtx_code test_code)
608 enum internal_test test = ITEST_MAX;
610 switch (test_code)
612 default: break;
613 case EQ: test = ITEST_EQ; break;
614 case NE: test = ITEST_NE; break;
615 case GT: test = ITEST_GT; break;
616 case GE: test = ITEST_GE; break;
617 case LT: test = ITEST_LT; break;
618 case LE: test = ITEST_LE; break;
619 case GTU: test = ITEST_GTU; break;
620 case GEU: test = ITEST_GEU; break;
621 case LTU: test = ITEST_LTU; break;
622 case LEU: test = ITEST_LEU; break;
625 return test;
629 /* Generate the code to compare two integer values. The return value is
630 the comparison expression. */
632 static rtx
633 gen_int_relational (enum rtx_code test_code, /* relational test (EQ, etc) */
634 rtx cmp0, /* first operand to compare */
635 rtx cmp1, /* second operand to compare */
636 int *p_invert /* whether branch needs to reverse test */)
638 struct cmp_info
640 enum rtx_code test_code; /* test code to use in insn */
641 bool (*const_range_p) (HOST_WIDE_INT); /* range check function */
642 int const_add; /* constant to add (convert LE -> LT) */
643 int reverse_regs; /* reverse registers in test */
644 int invert_const; /* != 0 if invert value if cmp1 is constant */
645 int invert_reg; /* != 0 if invert value if cmp1 is register */
646 int unsignedp; /* != 0 for unsigned comparisons. */
649 static struct cmp_info info[ (int)ITEST_MAX ] = {
651 { EQ, xtensa_b4const_or_zero, 0, 0, 0, 0, 0 }, /* EQ */
652 { NE, xtensa_b4const_or_zero, 0, 0, 0, 0, 0 }, /* NE */
654 { LT, xtensa_b4const_or_zero, 1, 1, 1, 0, 0 }, /* GT */
655 { GE, xtensa_b4const_or_zero, 0, 0, 0, 0, 0 }, /* GE */
656 { LT, xtensa_b4const_or_zero, 0, 0, 0, 0, 0 }, /* LT */
657 { GE, xtensa_b4const_or_zero, 1, 1, 1, 0, 0 }, /* LE */
659 { LTU, xtensa_b4constu, 1, 1, 1, 0, 1 }, /* GTU */
660 { GEU, xtensa_b4constu, 0, 0, 0, 0, 1 }, /* GEU */
661 { LTU, xtensa_b4constu, 0, 0, 0, 0, 1 }, /* LTU */
662 { GEU, xtensa_b4constu, 1, 1, 1, 0, 1 }, /* LEU */
665 enum internal_test test;
666 enum machine_mode mode;
667 struct cmp_info *p_info;
669 test = map_test_to_internal_test (test_code);
670 gcc_assert (test != ITEST_MAX);
672 p_info = &info[ (int)test ];
674 mode = GET_MODE (cmp0);
675 if (mode == VOIDmode)
676 mode = GET_MODE (cmp1);
678 /* Make sure we can handle any constants given to us. */
679 if (GET_CODE (cmp1) == CONST_INT)
681 HOST_WIDE_INT value = INTVAL (cmp1);
682 unsigned HOST_WIDE_INT uvalue = (unsigned HOST_WIDE_INT)value;
684 /* if the immediate overflows or does not fit in the immediate field,
685 spill it to a register */
687 if ((p_info->unsignedp ?
688 (uvalue + p_info->const_add > uvalue) :
689 (value + p_info->const_add > value)) != (p_info->const_add > 0))
691 cmp1 = force_reg (mode, cmp1);
693 else if (!(p_info->const_range_p) (value + p_info->const_add))
695 cmp1 = force_reg (mode, cmp1);
698 else if ((GET_CODE (cmp1) != REG) && (GET_CODE (cmp1) != SUBREG))
700 cmp1 = force_reg (mode, cmp1);
703 /* See if we need to invert the result. */
704 *p_invert = ((GET_CODE (cmp1) == CONST_INT)
705 ? p_info->invert_const
706 : p_info->invert_reg);
708 /* Comparison to constants, may involve adding 1 to change a LT into LE.
709 Comparison between two registers, may involve switching operands. */
710 if (GET_CODE (cmp1) == CONST_INT)
712 if (p_info->const_add != 0)
713 cmp1 = GEN_INT (INTVAL (cmp1) + p_info->const_add);
716 else if (p_info->reverse_regs)
718 rtx temp = cmp0;
719 cmp0 = cmp1;
720 cmp1 = temp;
723 return gen_rtx_fmt_ee (p_info->test_code, VOIDmode, cmp0, cmp1);
727 /* Generate the code to compare two float values. The return value is
728 the comparison expression. */
730 static rtx
731 gen_float_relational (enum rtx_code test_code, /* relational test (EQ, etc) */
732 rtx cmp0, /* first operand to compare */
733 rtx cmp1 /* second operand to compare */)
735 rtx (*gen_fn) (rtx, rtx, rtx);
736 rtx brtmp;
737 int reverse_regs, invert;
739 switch (test_code)
741 case EQ: reverse_regs = 0; invert = 0; gen_fn = gen_seq_sf; break;
742 case NE: reverse_regs = 0; invert = 1; gen_fn = gen_seq_sf; break;
743 case LE: reverse_regs = 0; invert = 0; gen_fn = gen_sle_sf; break;
744 case GT: reverse_regs = 1; invert = 0; gen_fn = gen_slt_sf; break;
745 case LT: reverse_regs = 0; invert = 0; gen_fn = gen_slt_sf; break;
746 case GE: reverse_regs = 1; invert = 0; gen_fn = gen_sle_sf; break;
747 default:
748 fatal_insn ("bad test", gen_rtx_fmt_ee (test_code, VOIDmode, cmp0, cmp1));
749 reverse_regs = 0; invert = 0; gen_fn = 0; /* avoid compiler warnings */
752 if (reverse_regs)
754 rtx temp = cmp0;
755 cmp0 = cmp1;
756 cmp1 = temp;
759 brtmp = gen_rtx_REG (CCmode, FPCC_REGNUM);
760 emit_insn (gen_fn (brtmp, cmp0, cmp1));
762 return gen_rtx_fmt_ee (invert ? EQ : NE, VOIDmode, brtmp, const0_rtx);
766 void
767 xtensa_expand_conditional_branch (rtx *operands, enum rtx_code test_code)
769 enum cmp_type type = branch_type;
770 rtx cmp0 = branch_cmp[0];
771 rtx cmp1 = branch_cmp[1];
772 rtx cmp;
773 int invert;
774 rtx label1, label2;
776 switch (type)
778 case CMP_DF:
779 default:
780 fatal_insn ("bad test", gen_rtx_fmt_ee (test_code, VOIDmode, cmp0, cmp1));
782 case CMP_SI:
783 invert = FALSE;
784 cmp = gen_int_relational (test_code, cmp0, cmp1, &invert);
785 break;
787 case CMP_SF:
788 if (!TARGET_HARD_FLOAT)
789 fatal_insn ("bad test", gen_rtx_fmt_ee (test_code, VOIDmode, cmp0, cmp1));
790 invert = FALSE;
791 cmp = gen_float_relational (test_code, cmp0, cmp1);
792 break;
795 /* Generate the branch. */
797 label1 = gen_rtx_LABEL_REF (VOIDmode, operands[0]);
798 label2 = pc_rtx;
800 if (invert)
802 label2 = label1;
803 label1 = pc_rtx;
806 emit_jump_insn (gen_rtx_SET (VOIDmode, pc_rtx,
807 gen_rtx_IF_THEN_ELSE (VOIDmode, cmp,
808 label1,
809 label2)));
813 static rtx
814 gen_conditional_move (rtx cmp)
816 enum rtx_code code = GET_CODE (cmp);
817 rtx op0 = branch_cmp[0];
818 rtx op1 = branch_cmp[1];
820 if (branch_type == CMP_SI)
822 /* Jump optimization calls get_condition() which canonicalizes
823 comparisons like (GE x <const>) to (GT x <const-1>).
824 Transform those comparisons back to GE, since that is the
825 comparison supported in Xtensa. We shouldn't have to
826 transform <LE x const> comparisons, because neither
827 xtensa_expand_conditional_branch() nor get_condition() will
828 produce them. */
830 if ((code == GT) && (op1 == constm1_rtx))
832 code = GE;
833 op1 = const0_rtx;
835 cmp = gen_rtx_fmt_ee (code, VOIDmode, cc0_rtx, const0_rtx);
837 if (boolean_operator (cmp, VOIDmode))
839 /* Swap the operands to make const0 second. */
840 if (op0 == const0_rtx)
842 op0 = op1;
843 op1 = const0_rtx;
846 /* If not comparing against zero, emit a comparison (subtract). */
847 if (op1 != const0_rtx)
849 op0 = expand_binop (SImode, sub_optab, op0, op1,
850 0, 0, OPTAB_LIB_WIDEN);
851 op1 = const0_rtx;
854 else if (branch_operator (cmp, VOIDmode))
856 /* Swap the operands to make const0 second. */
857 if (op0 == const0_rtx)
859 op0 = op1;
860 op1 = const0_rtx;
862 switch (code)
864 case LT: code = GE; break;
865 case GE: code = LT; break;
866 default: gcc_unreachable ();
870 if (op1 != const0_rtx)
871 return 0;
873 else
874 return 0;
876 return gen_rtx_fmt_ee (code, VOIDmode, op0, op1);
879 if (TARGET_HARD_FLOAT && (branch_type == CMP_SF))
880 return gen_float_relational (code, op0, op1);
882 return 0;
887 xtensa_expand_conditional_move (rtx *operands, int isflt)
889 rtx cmp;
890 rtx (*gen_fn) (rtx, rtx, rtx, rtx, rtx);
892 if (!(cmp = gen_conditional_move (operands[1])))
893 return 0;
895 if (isflt)
896 gen_fn = (branch_type == CMP_SI
897 ? gen_movsfcc_internal0
898 : gen_movsfcc_internal1);
899 else
900 gen_fn = (branch_type == CMP_SI
901 ? gen_movsicc_internal0
902 : gen_movsicc_internal1);
904 emit_insn (gen_fn (operands[0], XEXP (cmp, 0),
905 operands[2], operands[3], cmp));
906 return 1;
911 xtensa_expand_scc (rtx *operands)
913 rtx dest = operands[0];
914 rtx cmp = operands[1];
915 rtx one_tmp, zero_tmp;
916 rtx (*gen_fn) (rtx, rtx, rtx, rtx, rtx);
918 if (!(cmp = gen_conditional_move (cmp)))
919 return 0;
921 one_tmp = gen_reg_rtx (SImode);
922 zero_tmp = gen_reg_rtx (SImode);
923 emit_insn (gen_movsi (one_tmp, const_true_rtx));
924 emit_insn (gen_movsi (zero_tmp, const0_rtx));
926 gen_fn = (branch_type == CMP_SI
927 ? gen_movsicc_internal0
928 : gen_movsicc_internal1);
929 emit_insn (gen_fn (dest, XEXP (cmp, 0), one_tmp, zero_tmp, cmp));
930 return 1;
934 /* Split OP[1] into OP[2,3] and likewise for OP[0] into OP[0,1]. MODE is
935 for the output, i.e., the input operands are twice as big as MODE. */
937 void
938 xtensa_split_operand_pair (rtx operands[4], enum machine_mode mode)
940 switch (GET_CODE (operands[1]))
942 case REG:
943 operands[3] = gen_rtx_REG (mode, REGNO (operands[1]) + 1);
944 operands[2] = gen_rtx_REG (mode, REGNO (operands[1]));
945 break;
947 case MEM:
948 operands[3] = adjust_address (operands[1], mode, GET_MODE_SIZE (mode));
949 operands[2] = adjust_address (operands[1], mode, 0);
950 break;
952 case CONST_INT:
953 case CONST_DOUBLE:
954 split_double (operands[1], &operands[2], &operands[3]);
955 break;
957 default:
958 gcc_unreachable ();
961 switch (GET_CODE (operands[0]))
963 case REG:
964 operands[1] = gen_rtx_REG (mode, REGNO (operands[0]) + 1);
965 operands[0] = gen_rtx_REG (mode, REGNO (operands[0]));
966 break;
968 case MEM:
969 operands[1] = adjust_address (operands[0], mode, GET_MODE_SIZE (mode));
970 operands[0] = adjust_address (operands[0], mode, 0);
971 break;
973 default:
974 gcc_unreachable ();
979 /* Emit insns to move operands[1] into operands[0].
980 Return 1 if we have written out everything that needs to be done to
981 do the move. Otherwise, return 0 and the caller will emit the move
982 normally. */
985 xtensa_emit_move_sequence (rtx *operands, enum machine_mode mode)
987 if (CONSTANT_P (operands[1])
988 && (GET_CODE (operands[1]) != CONST_INT
989 || !xtensa_simm12b (INTVAL (operands[1]))))
991 if (!TARGET_CONST16)
992 operands[1] = force_const_mem (SImode, operands[1]);
994 /* PC-relative loads are always SImode, and CONST16 is only
995 supported in the movsi pattern, so add a SUBREG for any other
996 (smaller) mode. */
998 if (mode != SImode)
1000 if (register_operand (operands[0], mode))
1002 operands[0] = simplify_gen_subreg (SImode, operands[0], mode, 0);
1003 emit_move_insn (operands[0], operands[1]);
1004 return 1;
1006 else
1008 operands[1] = force_reg (SImode, operands[1]);
1009 operands[1] = gen_lowpart_SUBREG (mode, operands[1]);
1014 if (!(reload_in_progress | reload_completed)
1015 && !xtensa_valid_move (mode, operands))
1016 operands[1] = force_reg (mode, operands[1]);
1018 operands[1] = xtensa_copy_incoming_a7 (operands[1]);
1020 /* During reload we don't want to emit (subreg:X (mem:Y)) since that
1021 instruction won't be recognized after reload, so we remove the
1022 subreg and adjust mem accordingly. */
1023 if (reload_in_progress)
1025 operands[0] = fixup_subreg_mem (operands[0]);
1026 operands[1] = fixup_subreg_mem (operands[1]);
1028 return 0;
1032 static rtx
1033 fixup_subreg_mem (rtx x)
1035 if (GET_CODE (x) == SUBREG
1036 && GET_CODE (SUBREG_REG (x)) == REG
1037 && REGNO (SUBREG_REG (x)) >= FIRST_PSEUDO_REGISTER)
1039 rtx temp =
1040 gen_rtx_SUBREG (GET_MODE (x),
1041 reg_equiv_mem [REGNO (SUBREG_REG (x))],
1042 SUBREG_BYTE (x));
1043 x = alter_subreg (&temp);
1045 return x;
1049 /* Check if an incoming argument in a7 is expected to be used soon and
1050 if OPND is a register or register pair that includes a7. If so,
1051 create a new pseudo and copy a7 into that pseudo at the very
1052 beginning of the function, followed by the special "set_frame_ptr"
1053 unspec_volatile insn. The return value is either the original
1054 operand, if it is not a7, or the new pseudo containing a copy of
1055 the incoming argument. This is necessary because the register
1056 allocator will ignore conflicts with a7 and may either assign some
1057 other pseudo to a7 or use a7 as the hard_frame_pointer, clobbering
1058 the incoming argument in a7. By copying the argument out of a7 as
1059 the very first thing, and then immediately following that with an
1060 unspec_volatile to keep the scheduler away, we should avoid any
1061 problems. Putting the set_frame_ptr insn at the beginning, with
1062 only the a7 copy before it, also makes it easier for the prologue
1063 expander to initialize the frame pointer after the a7 copy and to
1064 fix up the a7 copy to use the stack pointer instead of the frame
1065 pointer. */
1068 xtensa_copy_incoming_a7 (rtx opnd)
1070 rtx entry_insns = 0;
1071 rtx reg, tmp;
1072 enum machine_mode mode;
1074 if (!cfun->machine->need_a7_copy)
1075 return opnd;
1077 /* This function should never be called again once a7 has been copied. */
1078 gcc_assert (!cfun->machine->set_frame_ptr_insn);
1080 mode = GET_MODE (opnd);
1082 /* The operand using a7 may come in a later instruction, so just return
1083 the original operand if it doesn't use a7. */
1084 reg = opnd;
1085 if (GET_CODE (reg) == SUBREG)
1087 gcc_assert (SUBREG_BYTE (reg) == 0);
1088 reg = SUBREG_REG (reg);
1090 if (GET_CODE (reg) != REG
1091 || REGNO (reg) > A7_REG
1092 || REGNO (reg) + HARD_REGNO_NREGS (A7_REG, mode) <= A7_REG)
1093 return opnd;
1095 /* 1-word args will always be in a7; 2-word args in a6/a7. */
1096 gcc_assert (REGNO (reg) + HARD_REGNO_NREGS (A7_REG, mode) - 1 == A7_REG);
1098 cfun->machine->need_a7_copy = false;
1100 /* Copy a7 to a new pseudo at the function entry. Use gen_raw_REG to
1101 create the REG for a7 so that hard_frame_pointer_rtx is not used. */
1103 push_to_sequence (entry_insns);
1104 tmp = gen_reg_rtx (mode);
1106 switch (mode)
1108 case DFmode:
1109 case DImode:
1110 emit_insn (gen_movsi_internal (gen_rtx_SUBREG (SImode, tmp, 0),
1111 gen_rtx_REG (SImode, A7_REG - 1)));
1112 emit_insn (gen_movsi_internal (gen_rtx_SUBREG (SImode, tmp, 4),
1113 gen_raw_REG (SImode, A7_REG)));
1114 break;
1115 case SFmode:
1116 emit_insn (gen_movsf_internal (tmp, gen_raw_REG (mode, A7_REG)));
1117 break;
1118 case SImode:
1119 emit_insn (gen_movsi_internal (tmp, gen_raw_REG (mode, A7_REG)));
1120 break;
1121 case HImode:
1122 emit_insn (gen_movhi_internal (tmp, gen_raw_REG (mode, A7_REG)));
1123 break;
1124 case QImode:
1125 emit_insn (gen_movqi_internal (tmp, gen_raw_REG (mode, A7_REG)));
1126 break;
1127 default:
1128 gcc_unreachable ();
1131 cfun->machine->set_frame_ptr_insn = emit_insn (gen_set_frame_ptr ());
1132 entry_insns = get_insns ();
1133 end_sequence ();
1135 if (cfun->machine->vararg_a7)
1137 /* This is called from within builtin_savereg, so we're already
1138 inside a start_sequence that will be placed at the start of
1139 the function. */
1140 emit_insn (entry_insns);
1142 else
1144 /* Put entry_insns after the NOTE that starts the function. If
1145 this is inside a start_sequence, make the outer-level insn
1146 chain current, so the code is placed at the start of the
1147 function. */
1148 push_topmost_sequence ();
1149 emit_insn_after (entry_insns, get_insns ());
1150 pop_topmost_sequence ();
1153 return tmp;
1157 /* Try to expand a block move operation to a sequence of RTL move
1158 instructions. If not optimizing, or if the block size is not a
1159 constant, or if the block is too large, the expansion fails and GCC
1160 falls back to calling memcpy().
1162 operands[0] is the destination
1163 operands[1] is the source
1164 operands[2] is the length
1165 operands[3] is the alignment */
1168 xtensa_expand_block_move (rtx *operands)
1170 static const enum machine_mode mode_from_align[] =
1172 VOIDmode, QImode, HImode, VOIDmode, SImode,
1175 rtx dst_mem = operands[0];
1176 rtx src_mem = operands[1];
1177 HOST_WIDE_INT bytes, align;
1178 int num_pieces, move_ratio;
1179 rtx temp[2];
1180 enum machine_mode mode[2];
1181 int amount[2];
1182 bool active[2];
1183 int phase = 0;
1184 int next;
1185 int offset_ld = 0;
1186 int offset_st = 0;
1187 rtx x;
1189 /* If this is not a fixed size move, just call memcpy. */
1190 if (!optimize || (GET_CODE (operands[2]) != CONST_INT))
1191 return 0;
1193 bytes = INTVAL (operands[2]);
1194 align = INTVAL (operands[3]);
1196 /* Anything to move? */
1197 if (bytes <= 0)
1198 return 0;
1200 if (align > MOVE_MAX)
1201 align = MOVE_MAX;
1203 /* Decide whether to expand inline based on the optimization level. */
1204 move_ratio = 4;
1205 if (optimize > 2)
1206 move_ratio = LARGEST_MOVE_RATIO;
1207 num_pieces = (bytes / align) + (bytes % align); /* Close enough anyway. */
1208 if (num_pieces > move_ratio)
1209 return 0;
1211 x = XEXP (dst_mem, 0);
1212 if (!REG_P (x))
1214 x = force_reg (Pmode, x);
1215 dst_mem = replace_equiv_address (dst_mem, x);
1218 x = XEXP (src_mem, 0);
1219 if (!REG_P (x))
1221 x = force_reg (Pmode, x);
1222 src_mem = replace_equiv_address (src_mem, x);
1225 active[0] = active[1] = false;
1229 next = phase;
1230 phase ^= 1;
1232 if (bytes > 0)
1234 int next_amount;
1236 next_amount = (bytes >= 4 ? 4 : (bytes >= 2 ? 2 : 1));
1237 next_amount = MIN (next_amount, align);
1239 amount[next] = next_amount;
1240 mode[next] = mode_from_align[next_amount];
1241 temp[next] = gen_reg_rtx (mode[next]);
1243 x = adjust_address (src_mem, mode[next], offset_ld);
1244 emit_insn (gen_rtx_SET (VOIDmode, temp[next], x));
1246 offset_ld += next_amount;
1247 bytes -= next_amount;
1248 active[next] = true;
1251 if (active[phase])
1253 active[phase] = false;
1255 x = adjust_address (dst_mem, mode[phase], offset_st);
1256 emit_insn (gen_rtx_SET (VOIDmode, x, temp[phase]));
1258 offset_st += amount[phase];
1261 while (active[next]);
1263 return 1;
1267 void
1268 xtensa_expand_nonlocal_goto (rtx *operands)
1270 rtx goto_handler = operands[1];
1271 rtx containing_fp = operands[3];
1273 /* Generate a call to "__xtensa_nonlocal_goto" (in libgcc); the code
1274 is too big to generate in-line. */
1276 if (GET_CODE (containing_fp) != REG)
1277 containing_fp = force_reg (Pmode, containing_fp);
1279 goto_handler = replace_rtx (copy_rtx (goto_handler),
1280 virtual_stack_vars_rtx,
1281 containing_fp);
1283 emit_library_call (gen_rtx_SYMBOL_REF (Pmode, "__xtensa_nonlocal_goto"),
1284 0, VOIDmode, 2,
1285 containing_fp, Pmode,
1286 goto_handler, Pmode);
1290 static struct machine_function *
1291 xtensa_init_machine_status (void)
1293 return ggc_alloc_cleared (sizeof (struct machine_function));
1297 void
1298 xtensa_setup_frame_addresses (void)
1300 /* Set flag to cause FRAME_POINTER_REQUIRED to be set. */
1301 cfun->machine->accesses_prev_frame = 1;
1303 emit_library_call
1304 (gen_rtx_SYMBOL_REF (Pmode, "__xtensa_libgcc_window_spill"),
1305 0, VOIDmode, 0);
1309 /* Emit the assembly for the end of a zero-cost loop. Normally we just emit
1310 a comment showing where the end of the loop is. However, if there is a
1311 label or a branch at the end of the loop then we need to place a nop
1312 there. If the loop ends with a label we need the nop so that branches
1313 targeting that label will target the nop (and thus remain in the loop),
1314 instead of targeting the instruction after the loop (and thus exiting
1315 the loop). If the loop ends with a branch, we need the nop in case the
1316 branch is targeting a location inside the loop. When the branch
1317 executes it will cause the loop count to be decremented even if it is
1318 taken (because it is the last instruction in the loop), so we need to
1319 nop after the branch to prevent the loop count from being decremented
1320 when the branch is taken. */
1322 void
1323 xtensa_emit_loop_end (rtx insn, rtx *operands)
1325 char done = 0;
1327 for (insn = PREV_INSN (insn); insn && !done; insn = PREV_INSN (insn))
1329 switch (GET_CODE (insn))
1331 case NOTE:
1332 case BARRIER:
1333 break;
1335 case CODE_LABEL:
1336 output_asm_insn (TARGET_DENSITY ? "nop.n" : "nop", operands);
1337 done = 1;
1338 break;
1340 default:
1342 rtx body = PATTERN (insn);
1344 if (GET_CODE (body) == JUMP_INSN)
1346 output_asm_insn (TARGET_DENSITY ? "nop.n" : "nop", operands);
1347 done = 1;
1349 else if ((GET_CODE (body) != USE)
1350 && (GET_CODE (body) != CLOBBER))
1351 done = 1;
1353 break;
1357 output_asm_insn ("# loop end for %0", operands);
1361 char *
1362 xtensa_emit_call (int callop, rtx *operands)
1364 static char result[64];
1365 rtx tgt = operands[callop];
1367 if (GET_CODE (tgt) == CONST_INT)
1368 sprintf (result, "call8\t0x%lx", INTVAL (tgt));
1369 else if (register_operand (tgt, VOIDmode))
1370 sprintf (result, "callx8\t%%%d", callop);
1371 else
1372 sprintf (result, "call8\t%%%d", callop);
1374 return result;
1378 /* Return the debugger register number to use for 'regno'. */
1381 xtensa_dbx_register_number (int regno)
1383 int first = -1;
1385 if (GP_REG_P (regno))
1387 regno -= GP_REG_FIRST;
1388 first = 0;
1390 else if (BR_REG_P (regno))
1392 regno -= BR_REG_FIRST;
1393 first = 16;
1395 else if (FP_REG_P (regno))
1397 regno -= FP_REG_FIRST;
1398 first = 48;
1400 else if (ACC_REG_P (regno))
1402 first = 0x200; /* Start of Xtensa special registers. */
1403 regno = 16; /* ACCLO is special register 16. */
1406 /* When optimizing, we sometimes get asked about pseudo-registers
1407 that don't represent hard registers. Return 0 for these. */
1408 if (first == -1)
1409 return 0;
1411 return first + regno;
1415 /* Argument support functions. */
1417 /* Initialize CUMULATIVE_ARGS for a function. */
1419 void
1420 init_cumulative_args (CUMULATIVE_ARGS *cum, int incoming)
1422 cum->arg_words = 0;
1423 cum->incoming = incoming;
1427 /* Advance the argument to the next argument position. */
1429 void
1430 function_arg_advance (CUMULATIVE_ARGS *cum, enum machine_mode mode, tree type)
1432 int words, max;
1433 int *arg_words;
1435 arg_words = &cum->arg_words;
1436 max = MAX_ARGS_IN_REGISTERS;
1438 words = (((mode != BLKmode)
1439 ? (int) GET_MODE_SIZE (mode)
1440 : int_size_in_bytes (type)) + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
1442 if (*arg_words < max
1443 && (targetm.calls.must_pass_in_stack (mode, type)
1444 || *arg_words + words > max))
1445 *arg_words = max;
1447 *arg_words += words;
1451 /* Return an RTL expression containing the register for the given mode,
1452 or 0 if the argument is to be passed on the stack. INCOMING_P is nonzero
1453 if this is an incoming argument to the current function. */
1456 function_arg (CUMULATIVE_ARGS *cum, enum machine_mode mode, tree type,
1457 int incoming_p)
1459 int regbase, words, max;
1460 int *arg_words;
1461 int regno;
1463 arg_words = &cum->arg_words;
1464 regbase = (incoming_p ? GP_ARG_FIRST : GP_OUTGOING_ARG_FIRST);
1465 max = MAX_ARGS_IN_REGISTERS;
1467 words = (((mode != BLKmode)
1468 ? (int) GET_MODE_SIZE (mode)
1469 : int_size_in_bytes (type)) + UNITS_PER_WORD - 1) / UNITS_PER_WORD;
1471 if (type && (TYPE_ALIGN (type) > BITS_PER_WORD))
1473 int align = MIN (TYPE_ALIGN (type), STACK_BOUNDARY) / BITS_PER_WORD;
1474 *arg_words = (*arg_words + align - 1) & -align;
1477 if (*arg_words + words > max)
1478 return (rtx)0;
1480 regno = regbase + *arg_words;
1482 if (cum->incoming && regno <= A7_REG && regno + words > A7_REG)
1483 cfun->machine->need_a7_copy = true;
1485 return gen_rtx_REG (mode, regno);
1490 function_arg_boundary (enum machine_mode mode, tree type)
1492 unsigned int alignment;
1494 alignment = type ? TYPE_ALIGN (type) : GET_MODE_ALIGNMENT (mode);
1495 if (alignment < PARM_BOUNDARY)
1496 alignment = PARM_BOUNDARY;
1497 if (alignment > STACK_BOUNDARY)
1498 alignment = STACK_BOUNDARY;
1499 return alignment;
1503 static bool
1504 xtensa_return_in_msb (tree valtype)
1506 return (TARGET_BIG_ENDIAN
1507 && AGGREGATE_TYPE_P (valtype)
1508 && int_size_in_bytes (valtype) >= UNITS_PER_WORD);
1512 void
1513 override_options (void)
1515 int regno;
1516 enum machine_mode mode;
1518 if (!TARGET_BOOLEANS && TARGET_HARD_FLOAT)
1519 error ("boolean registers required for the floating-point option");
1521 xtensa_char_to_class['q'] = SP_REG;
1522 xtensa_char_to_class['a'] = GR_REGS;
1523 xtensa_char_to_class['b'] = ((TARGET_BOOLEANS) ? BR_REGS : NO_REGS);
1524 xtensa_char_to_class['f'] = ((TARGET_HARD_FLOAT) ? FP_REGS : NO_REGS);
1525 xtensa_char_to_class['A'] = ((TARGET_MAC16) ? ACC_REG : NO_REGS);
1526 xtensa_char_to_class['B'] = ((TARGET_SEXT) ? GR_REGS : NO_REGS);
1527 xtensa_char_to_class['C'] = ((TARGET_MUL16) ? GR_REGS: NO_REGS);
1528 xtensa_char_to_class['D'] = ((TARGET_DENSITY) ? GR_REGS: NO_REGS);
1529 xtensa_char_to_class['d'] = ((TARGET_DENSITY) ? AR_REGS: NO_REGS);
1530 xtensa_char_to_class['W'] = ((TARGET_CONST16) ? GR_REGS: NO_REGS);
1532 /* Set up array giving whether a given register can hold a given mode. */
1533 for (mode = VOIDmode;
1534 mode != MAX_MACHINE_MODE;
1535 mode = (enum machine_mode) ((int) mode + 1))
1537 int size = GET_MODE_SIZE (mode);
1538 enum mode_class class = GET_MODE_CLASS (mode);
1540 for (regno = 0; regno < FIRST_PSEUDO_REGISTER; regno++)
1542 int temp;
1544 if (ACC_REG_P (regno))
1545 temp = (TARGET_MAC16
1546 && (class == MODE_INT) && (size <= UNITS_PER_WORD));
1547 else if (GP_REG_P (regno))
1548 temp = ((regno & 1) == 0 || (size <= UNITS_PER_WORD));
1549 else if (FP_REG_P (regno))
1550 temp = (TARGET_HARD_FLOAT && (mode == SFmode));
1551 else if (BR_REG_P (regno))
1552 temp = (TARGET_BOOLEANS && (mode == CCmode));
1553 else
1554 temp = FALSE;
1556 xtensa_hard_regno_mode_ok[(int) mode][regno] = temp;
1560 init_machine_status = xtensa_init_machine_status;
1562 /* Check PIC settings. PIC is only supported when using L32R
1563 instructions, and some targets need to always use PIC. */
1564 if (flag_pic && TARGET_CONST16)
1565 error ("-f%s is not supported with CONST16 instructions",
1566 (flag_pic > 1 ? "PIC" : "pic"));
1567 else if (XTENSA_ALWAYS_PIC)
1569 if (TARGET_CONST16)
1570 error ("PIC is required but not supported with CONST16 instructions");
1571 flag_pic = 1;
1573 /* There's no need for -fPIC (as opposed to -fpic) on Xtensa. */
1574 if (flag_pic > 1)
1575 flag_pic = 1;
1577 /* Hot/cold partitioning does not work on this architecture, because of
1578 constant pools (the load instruction cannot necessarily reach that far).
1579 Therefore disable it on this architecture. */
1580 if (flag_reorder_blocks_and_partition)
1582 flag_reorder_blocks_and_partition = 0;
1583 flag_reorder_blocks = 1;
1588 /* A C compound statement to output to stdio stream STREAM the
1589 assembler syntax for an instruction operand X. X is an RTL
1590 expression.
1592 CODE is a value that can be used to specify one of several ways
1593 of printing the operand. It is used when identical operands
1594 must be printed differently depending on the context. CODE
1595 comes from the '%' specification that was used to request
1596 printing of the operand. If the specification was just '%DIGIT'
1597 then CODE is 0; if the specification was '%LTR DIGIT' then CODE
1598 is the ASCII code for LTR.
1600 If X is a register, this macro should print the register's name.
1601 The names can be found in an array 'reg_names' whose type is
1602 'char *[]'. 'reg_names' is initialized from 'REGISTER_NAMES'.
1604 When the machine description has a specification '%PUNCT' (a '%'
1605 followed by a punctuation character), this macro is called with
1606 a null pointer for X and the punctuation character for CODE.
1608 'a', 'c', 'l', and 'n' are reserved.
1610 The Xtensa specific codes are:
1612 'd' CONST_INT, print as signed decimal
1613 'x' CONST_INT, print as signed hexadecimal
1614 'K' CONST_INT, print number of bits in mask for EXTUI
1615 'R' CONST_INT, print (X & 0x1f)
1616 'L' CONST_INT, print ((32 - X) & 0x1f)
1617 'D' REG, print second register of double-word register operand
1618 'N' MEM, print address of next word following a memory operand
1619 'v' MEM, if memory reference is volatile, output a MEMW before it
1620 't' any constant, add "@h" suffix for top 16 bits
1621 'b' any constant, add "@l" suffix for bottom 16 bits
1624 static void
1625 printx (FILE *file, signed int val)
1627 /* Print a hexadecimal value in a nice way. */
1628 if ((val > -0xa) && (val < 0xa))
1629 fprintf (file, "%d", val);
1630 else if (val < 0)
1631 fprintf (file, "-0x%x", -val);
1632 else
1633 fprintf (file, "0x%x", val);
1637 void
1638 print_operand (FILE *file, rtx x, int letter)
1640 if (!x)
1641 error ("PRINT_OPERAND null pointer");
1643 switch (letter)
1645 case 'D':
1646 if (GET_CODE (x) == REG || GET_CODE (x) == SUBREG)
1647 fprintf (file, "%s", reg_names[xt_true_regnum (x) + 1]);
1648 else
1649 output_operand_lossage ("invalid %%D value");
1650 break;
1652 case 'v':
1653 if (GET_CODE (x) == MEM)
1655 /* For a volatile memory reference, emit a MEMW before the
1656 load or store. */
1657 if (MEM_VOLATILE_P (x))
1658 fprintf (file, "memw\n\t");
1660 else
1661 output_operand_lossage ("invalid %%v value");
1662 break;
1664 case 'N':
1665 if (GET_CODE (x) == MEM
1666 && (GET_MODE (x) == DFmode || GET_MODE (x) == DImode))
1668 x = adjust_address (x, GET_MODE (x) == DFmode ? SFmode : SImode, 4);
1669 output_address (XEXP (x, 0));
1671 else
1672 output_operand_lossage ("invalid %%N value");
1673 break;
1675 case 'K':
1676 if (GET_CODE (x) == CONST_INT)
1678 int num_bits = 0;
1679 unsigned val = INTVAL (x);
1680 while (val & 1)
1682 num_bits += 1;
1683 val = val >> 1;
1685 if ((val != 0) || (num_bits == 0) || (num_bits > 16))
1686 fatal_insn ("invalid mask", x);
1688 fprintf (file, "%d", num_bits);
1690 else
1691 output_operand_lossage ("invalid %%K value");
1692 break;
1694 case 'L':
1695 if (GET_CODE (x) == CONST_INT)
1696 fprintf (file, "%ld", (32 - INTVAL (x)) & 0x1f);
1697 else
1698 output_operand_lossage ("invalid %%L value");
1699 break;
1701 case 'R':
1702 if (GET_CODE (x) == CONST_INT)
1703 fprintf (file, "%ld", INTVAL (x) & 0x1f);
1704 else
1705 output_operand_lossage ("invalid %%R value");
1706 break;
1708 case 'x':
1709 if (GET_CODE (x) == CONST_INT)
1710 printx (file, INTVAL (x));
1711 else
1712 output_operand_lossage ("invalid %%x value");
1713 break;
1715 case 'd':
1716 if (GET_CODE (x) == CONST_INT)
1717 fprintf (file, "%ld", INTVAL (x));
1718 else
1719 output_operand_lossage ("invalid %%d value");
1720 break;
1722 case 't':
1723 case 'b':
1724 if (GET_CODE (x) == CONST_INT)
1726 printx (file, INTVAL (x));
1727 fputs (letter == 't' ? "@h" : "@l", file);
1729 else if (GET_CODE (x) == CONST_DOUBLE)
1731 REAL_VALUE_TYPE r;
1732 REAL_VALUE_FROM_CONST_DOUBLE (r, x);
1733 if (GET_MODE (x) == SFmode)
1735 long l;
1736 REAL_VALUE_TO_TARGET_SINGLE (r, l);
1737 fprintf (file, "0x%08lx@%c", l, letter == 't' ? 'h' : 'l');
1739 else
1740 output_operand_lossage ("invalid %%t/%%b value");
1742 else if (GET_CODE (x) == CONST)
1744 /* X must be a symbolic constant on ELF. Write an expression
1745 suitable for 'const16' that sets the high or low 16 bits. */
1746 if (GET_CODE (XEXP (x, 0)) != PLUS
1747 || (GET_CODE (XEXP (XEXP (x, 0), 0)) != SYMBOL_REF
1748 && GET_CODE (XEXP (XEXP (x, 0), 0)) != LABEL_REF)
1749 || GET_CODE (XEXP (XEXP (x, 0), 1)) != CONST_INT)
1750 output_operand_lossage ("invalid %%t/%%b value");
1751 print_operand (file, XEXP (XEXP (x, 0), 0), 0);
1752 fputs (letter == 't' ? "@h" : "@l", file);
1753 /* There must be a non-alphanumeric character between 'h' or 'l'
1754 and the number. The '-' is added by print_operand() already. */
1755 if (INTVAL (XEXP (XEXP (x, 0), 1)) >= 0)
1756 fputs ("+", file);
1757 print_operand (file, XEXP (XEXP (x, 0), 1), 0);
1759 else
1761 output_addr_const (file, x);
1762 fputs (letter == 't' ? "@h" : "@l", file);
1764 break;
1766 default:
1767 if (GET_CODE (x) == REG || GET_CODE (x) == SUBREG)
1768 fprintf (file, "%s", reg_names[xt_true_regnum (x)]);
1769 else if (GET_CODE (x) == MEM)
1770 output_address (XEXP (x, 0));
1771 else if (GET_CODE (x) == CONST_INT)
1772 fprintf (file, "%ld", INTVAL (x));
1773 else
1774 output_addr_const (file, x);
1779 /* A C compound statement to output to stdio stream STREAM the
1780 assembler syntax for an instruction operand that is a memory
1781 reference whose address is ADDR. ADDR is an RTL expression. */
1783 void
1784 print_operand_address (FILE *file, rtx addr)
1786 if (!addr)
1787 error ("PRINT_OPERAND_ADDRESS, null pointer");
1789 switch (GET_CODE (addr))
1791 default:
1792 fatal_insn ("invalid address", addr);
1793 break;
1795 case REG:
1796 fprintf (file, "%s, 0", reg_names [REGNO (addr)]);
1797 break;
1799 case PLUS:
1801 rtx reg = (rtx)0;
1802 rtx offset = (rtx)0;
1803 rtx arg0 = XEXP (addr, 0);
1804 rtx arg1 = XEXP (addr, 1);
1806 if (GET_CODE (arg0) == REG)
1808 reg = arg0;
1809 offset = arg1;
1811 else if (GET_CODE (arg1) == REG)
1813 reg = arg1;
1814 offset = arg0;
1816 else
1817 fatal_insn ("no register in address", addr);
1819 if (CONSTANT_P (offset))
1821 fprintf (file, "%s, ", reg_names [REGNO (reg)]);
1822 output_addr_const (file, offset);
1824 else
1825 fatal_insn ("address offset not a constant", addr);
1827 break;
1829 case LABEL_REF:
1830 case SYMBOL_REF:
1831 case CONST_INT:
1832 case CONST:
1833 output_addr_const (file, addr);
1834 break;
1839 void
1840 xtensa_output_literal (FILE *file, rtx x, enum machine_mode mode, int labelno)
1842 long value_long[2];
1843 REAL_VALUE_TYPE r;
1844 int size;
1846 fprintf (file, "\t.literal .LC%u, ", (unsigned) labelno);
1848 switch (GET_MODE_CLASS (mode))
1850 case MODE_FLOAT:
1851 gcc_assert (GET_CODE (x) == CONST_DOUBLE);
1853 REAL_VALUE_FROM_CONST_DOUBLE (r, x);
1854 switch (mode)
1856 case SFmode:
1857 REAL_VALUE_TO_TARGET_SINGLE (r, value_long[0]);
1858 fprintf (file, "0x%08lx\n", value_long[0]);
1859 break;
1861 case DFmode:
1862 REAL_VALUE_TO_TARGET_DOUBLE (r, value_long);
1863 fprintf (file, "0x%08lx, 0x%08lx\n",
1864 value_long[0], value_long[1]);
1865 break;
1867 default:
1868 gcc_unreachable ();
1871 break;
1873 case MODE_INT:
1874 case MODE_PARTIAL_INT:
1875 size = GET_MODE_SIZE (mode);
1876 switch (size)
1878 case 4:
1879 output_addr_const (file, x);
1880 fputs ("\n", file);
1881 break;
1883 case 8:
1884 output_addr_const (file, operand_subword (x, 0, 0, DImode));
1885 fputs (", ", file);
1886 output_addr_const (file, operand_subword (x, 1, 0, DImode));
1887 fputs ("\n", file);
1888 break;
1890 default:
1891 gcc_unreachable ();
1893 break;
1895 default:
1896 gcc_unreachable ();
1901 /* Return the bytes needed to compute the frame pointer from the current
1902 stack pointer. */
1904 #define STACK_BYTES (STACK_BOUNDARY / BITS_PER_UNIT)
1905 #define XTENSA_STACK_ALIGN(LOC) (((LOC) + STACK_BYTES-1) & ~(STACK_BYTES-1))
1907 long
1908 compute_frame_size (int size)
1910 /* Add space for the incoming static chain value. */
1911 if (cfun->static_chain_decl != NULL)
1912 size += (1 * UNITS_PER_WORD);
1914 xtensa_current_frame_size =
1915 XTENSA_STACK_ALIGN (size
1916 + current_function_outgoing_args_size
1917 + (WINDOW_SIZE * UNITS_PER_WORD));
1918 return xtensa_current_frame_size;
1923 xtensa_frame_pointer_required (void)
1925 /* The code to expand builtin_frame_addr and builtin_return_addr
1926 currently uses the hard_frame_pointer instead of frame_pointer.
1927 This seems wrong but maybe it's necessary for other architectures.
1928 This function is derived from the i386 code. */
1930 if (cfun->machine->accesses_prev_frame)
1931 return 1;
1933 return 0;
1937 void
1938 xtensa_expand_prologue (void)
1940 HOST_WIDE_INT total_size;
1941 rtx size_rtx;
1943 total_size = compute_frame_size (get_frame_size ());
1944 size_rtx = GEN_INT (total_size);
1946 if (total_size < (1 << (12+3)))
1947 emit_insn (gen_entry (size_rtx, size_rtx));
1948 else
1950 /* Use a8 as a temporary since a0-a7 may be live. */
1951 rtx tmp_reg = gen_rtx_REG (Pmode, A8_REG);
1952 emit_insn (gen_entry (size_rtx, GEN_INT (MIN_FRAME_SIZE)));
1953 emit_move_insn (tmp_reg, GEN_INT (total_size - MIN_FRAME_SIZE));
1954 emit_insn (gen_subsi3 (tmp_reg, stack_pointer_rtx, tmp_reg));
1955 emit_move_insn (stack_pointer_rtx, tmp_reg);
1958 if (frame_pointer_needed)
1960 if (cfun->machine->set_frame_ptr_insn)
1962 rtx first, insn;
1964 push_topmost_sequence ();
1965 first = get_insns ();
1966 pop_topmost_sequence ();
1968 /* For all instructions prior to set_frame_ptr_insn, replace
1969 hard_frame_pointer references with stack_pointer. */
1970 for (insn = first;
1971 insn != cfun->machine->set_frame_ptr_insn;
1972 insn = NEXT_INSN (insn))
1974 if (INSN_P (insn))
1975 PATTERN (insn) = replace_rtx (copy_rtx (PATTERN (insn)),
1976 hard_frame_pointer_rtx,
1977 stack_pointer_rtx);
1980 else
1981 emit_move_insn (hard_frame_pointer_rtx, stack_pointer_rtx);
1986 /* Clear variables at function end. */
1988 void
1989 xtensa_function_epilogue (FILE *file ATTRIBUTE_UNUSED,
1990 HOST_WIDE_INT size ATTRIBUTE_UNUSED)
1992 xtensa_current_frame_size = 0;
1997 xtensa_return_addr (int count, rtx frame)
1999 rtx result, retaddr;
2001 if (count == -1)
2002 retaddr = gen_rtx_REG (Pmode, A0_REG);
2003 else
2005 rtx addr = plus_constant (frame, -4 * UNITS_PER_WORD);
2006 addr = memory_address (Pmode, addr);
2007 retaddr = gen_reg_rtx (Pmode);
2008 emit_move_insn (retaddr, gen_rtx_MEM (Pmode, addr));
2011 /* The 2 most-significant bits of the return address on Xtensa hold
2012 the register window size. To get the real return address, these
2013 bits must be replaced with the high bits from the current PC. */
2015 result = gen_reg_rtx (Pmode);
2016 emit_insn (gen_fix_return_addr (result, retaddr));
2017 return result;
2021 /* Create the va_list data type.
2023 This structure is set up by __builtin_saveregs. The __va_reg field
2024 points to a stack-allocated region holding the contents of the
2025 incoming argument registers. The __va_ndx field is an index
2026 initialized to the position of the first unnamed (variable)
2027 argument. This same index is also used to address the arguments
2028 passed in memory. Thus, the __va_stk field is initialized to point
2029 to the position of the first argument in memory offset to account
2030 for the arguments passed in registers and to account for the size
2031 of the argument registers not being 16-byte aligned. E.G., there
2032 are 6 argument registers of 4 bytes each, but we want the __va_ndx
2033 for the first stack argument to have the maximal alignment of 16
2034 bytes, so we offset the __va_stk address by 32 bytes so that
2035 __va_stk[32] references the first argument on the stack. */
2037 static tree
2038 xtensa_build_builtin_va_list (void)
2040 tree f_stk, f_reg, f_ndx, record, type_decl;
2042 record = (*lang_hooks.types.make_type) (RECORD_TYPE);
2043 type_decl = build_decl (TYPE_DECL, get_identifier ("__va_list_tag"), record);
2045 f_stk = build_decl (FIELD_DECL, get_identifier ("__va_stk"),
2046 ptr_type_node);
2047 f_reg = build_decl (FIELD_DECL, get_identifier ("__va_reg"),
2048 ptr_type_node);
2049 f_ndx = build_decl (FIELD_DECL, get_identifier ("__va_ndx"),
2050 integer_type_node);
2052 DECL_FIELD_CONTEXT (f_stk) = record;
2053 DECL_FIELD_CONTEXT (f_reg) = record;
2054 DECL_FIELD_CONTEXT (f_ndx) = record;
2056 TREE_CHAIN (record) = type_decl;
2057 TYPE_NAME (record) = type_decl;
2058 TYPE_FIELDS (record) = f_stk;
2059 TREE_CHAIN (f_stk) = f_reg;
2060 TREE_CHAIN (f_reg) = f_ndx;
2062 layout_type (record);
2063 return record;
2067 /* Save the incoming argument registers on the stack. Returns the
2068 address of the saved registers. */
2070 static rtx
2071 xtensa_builtin_saveregs (void)
2073 rtx gp_regs, dest;
2074 int arg_words = current_function_args_info.arg_words;
2075 int gp_left = MAX_ARGS_IN_REGISTERS - arg_words;
2077 if (gp_left <= 0)
2078 return const0_rtx;
2080 /* Allocate the general-purpose register space. */
2081 gp_regs = assign_stack_local
2082 (BLKmode, MAX_ARGS_IN_REGISTERS * UNITS_PER_WORD, -1);
2083 set_mem_alias_set (gp_regs, get_varargs_alias_set ());
2085 /* Now store the incoming registers. */
2086 dest = change_address (gp_regs, SImode,
2087 plus_constant (XEXP (gp_regs, 0),
2088 arg_words * UNITS_PER_WORD));
2089 cfun->machine->need_a7_copy = true;
2090 cfun->machine->vararg_a7 = true;
2091 move_block_from_reg (GP_ARG_FIRST + arg_words, dest, gp_left);
2093 return XEXP (gp_regs, 0);
2097 /* Implement `va_start' for varargs and stdarg. We look at the
2098 current function to fill in an initial va_list. */
2100 void
2101 xtensa_va_start (tree valist, rtx nextarg ATTRIBUTE_UNUSED)
2103 tree f_stk, stk;
2104 tree f_reg, reg;
2105 tree f_ndx, ndx;
2106 tree t, u;
2107 int arg_words;
2109 arg_words = current_function_args_info.arg_words;
2111 f_stk = TYPE_FIELDS (va_list_type_node);
2112 f_reg = TREE_CHAIN (f_stk);
2113 f_ndx = TREE_CHAIN (f_reg);
2115 stk = build3 (COMPONENT_REF, TREE_TYPE (f_stk), valist, f_stk, NULL_TREE);
2116 reg = build3 (COMPONENT_REF, TREE_TYPE (f_reg), valist, f_reg, NULL_TREE);
2117 ndx = build3 (COMPONENT_REF, TREE_TYPE (f_ndx), valist, f_ndx, NULL_TREE);
2119 /* Call __builtin_saveregs; save the result in __va_reg */
2120 u = make_tree (ptr_type_node, expand_builtin_saveregs ());
2121 t = build2 (MODIFY_EXPR, ptr_type_node, reg, u);
2122 TREE_SIDE_EFFECTS (t) = 1;
2123 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
2125 /* Set the __va_stk member to ($arg_ptr - 32). */
2126 u = make_tree (ptr_type_node, virtual_incoming_args_rtx);
2127 u = fold_build2 (PLUS_EXPR, ptr_type_node, u,
2128 build_int_cst (NULL_TREE, -32));
2129 t = build2 (MODIFY_EXPR, ptr_type_node, stk, u);
2130 TREE_SIDE_EFFECTS (t) = 1;
2131 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
2133 /* Set the __va_ndx member. If the first variable argument is on
2134 the stack, adjust __va_ndx by 2 words to account for the extra
2135 alignment offset for __va_stk. */
2136 if (arg_words >= MAX_ARGS_IN_REGISTERS)
2137 arg_words += 2;
2138 u = build_int_cst (NULL_TREE, arg_words * UNITS_PER_WORD);
2139 t = build2 (MODIFY_EXPR, integer_type_node, ndx, u);
2140 TREE_SIDE_EFFECTS (t) = 1;
2141 expand_expr (t, const0_rtx, VOIDmode, EXPAND_NORMAL);
2145 /* Implement `va_arg'. */
2147 static tree
2148 xtensa_gimplify_va_arg_expr (tree valist, tree type, tree *pre_p,
2149 tree *post_p ATTRIBUTE_UNUSED)
2151 tree f_stk, stk;
2152 tree f_reg, reg;
2153 tree f_ndx, ndx;
2154 tree type_size, array, orig_ndx, addr, size, va_size, t;
2155 tree lab_false, lab_over, lab_false2;
2156 bool indirect;
2158 indirect = pass_by_reference (NULL, TYPE_MODE (type), type, false);
2159 if (indirect)
2160 type = build_pointer_type (type);
2162 /* Handle complex values as separate real and imaginary parts. */
2163 if (TREE_CODE (type) == COMPLEX_TYPE)
2165 tree real_part, imag_part;
2167 real_part = xtensa_gimplify_va_arg_expr (valist, TREE_TYPE (type),
2168 pre_p, NULL);
2169 real_part = get_initialized_tmp_var (real_part, pre_p, NULL);
2171 imag_part = xtensa_gimplify_va_arg_expr (valist, TREE_TYPE (type),
2172 pre_p, NULL);
2173 imag_part = get_initialized_tmp_var (imag_part, pre_p, NULL);
2175 return build2 (COMPLEX_EXPR, type, real_part, imag_part);
2178 f_stk = TYPE_FIELDS (va_list_type_node);
2179 f_reg = TREE_CHAIN (f_stk);
2180 f_ndx = TREE_CHAIN (f_reg);
2182 stk = build3 (COMPONENT_REF, TREE_TYPE (f_stk), valist, f_stk, NULL_TREE);
2183 reg = build3 (COMPONENT_REF, TREE_TYPE (f_reg), valist, f_reg, NULL_TREE);
2184 ndx = build3 (COMPONENT_REF, TREE_TYPE (f_ndx), valist, f_ndx, NULL_TREE);
2186 type_size = size_in_bytes (type);
2187 va_size = round_up (type_size, UNITS_PER_WORD);
2188 gimplify_expr (&va_size, pre_p, NULL, is_gimple_val, fb_rvalue);
2191 /* First align __va_ndx if necessary for this arg:
2193 orig_ndx = (AP).__va_ndx;
2194 if (__alignof__ (TYPE) > 4 )
2195 orig_ndx = ((orig_ndx + __alignof__ (TYPE) - 1)
2196 & -__alignof__ (TYPE)); */
2198 orig_ndx = get_initialized_tmp_var (ndx, pre_p, NULL);
2200 if (TYPE_ALIGN (type) > BITS_PER_WORD)
2202 int align = MIN (TYPE_ALIGN (type), STACK_BOUNDARY) / BITS_PER_UNIT;
2204 t = build2 (PLUS_EXPR, integer_type_node, orig_ndx,
2205 build_int_cst (NULL_TREE, align - 1));
2206 t = build2 (BIT_AND_EXPR, integer_type_node, t,
2207 build_int_cst (NULL_TREE, -align));
2208 t = build2 (MODIFY_EXPR, integer_type_node, orig_ndx, t);
2209 gimplify_and_add (t, pre_p);
2213 /* Increment __va_ndx to point past the argument:
2215 (AP).__va_ndx = orig_ndx + __va_size (TYPE); */
2217 t = fold_convert (integer_type_node, va_size);
2218 t = build2 (PLUS_EXPR, integer_type_node, orig_ndx, t);
2219 t = build2 (MODIFY_EXPR, integer_type_node, ndx, t);
2220 gimplify_and_add (t, pre_p);
2223 /* Check if the argument is in registers:
2225 if ((AP).__va_ndx <= __MAX_ARGS_IN_REGISTERS * 4
2226 && !must_pass_in_stack (type))
2227 __array = (AP).__va_reg; */
2229 array = create_tmp_var (ptr_type_node, NULL);
2231 lab_over = NULL;
2232 if (!targetm.calls.must_pass_in_stack (TYPE_MODE (type), type))
2234 lab_false = create_artificial_label ();
2235 lab_over = create_artificial_label ();
2237 t = build_int_cst (NULL_TREE, MAX_ARGS_IN_REGISTERS * UNITS_PER_WORD);
2238 t = build2 (GT_EXPR, boolean_type_node, ndx, t);
2239 t = build3 (COND_EXPR, void_type_node, t,
2240 build1 (GOTO_EXPR, void_type_node, lab_false),
2241 NULL_TREE);
2242 gimplify_and_add (t, pre_p);
2244 t = build2 (MODIFY_EXPR, void_type_node, array, reg);
2245 gimplify_and_add (t, pre_p);
2247 t = build1 (GOTO_EXPR, void_type_node, lab_over);
2248 gimplify_and_add (t, pre_p);
2250 t = build1 (LABEL_EXPR, void_type_node, lab_false);
2251 gimplify_and_add (t, pre_p);
2255 /* ...otherwise, the argument is on the stack (never split between
2256 registers and the stack -- change __va_ndx if necessary):
2258 else
2260 if (orig_ndx <= __MAX_ARGS_IN_REGISTERS * 4)
2261 (AP).__va_ndx = 32 + __va_size (TYPE);
2262 __array = (AP).__va_stk;
2263 } */
2265 lab_false2 = create_artificial_label ();
2267 t = build_int_cst (NULL_TREE, MAX_ARGS_IN_REGISTERS * UNITS_PER_WORD);
2268 t = build2 (GT_EXPR, boolean_type_node, orig_ndx, t);
2269 t = build3 (COND_EXPR, void_type_node, t,
2270 build1 (GOTO_EXPR, void_type_node, lab_false2),
2271 NULL_TREE);
2272 gimplify_and_add (t, pre_p);
2274 t = size_binop (PLUS_EXPR, va_size, size_int (32));
2275 t = fold_convert (integer_type_node, t);
2276 t = build2 (MODIFY_EXPR, integer_type_node, ndx, t);
2277 gimplify_and_add (t, pre_p);
2279 t = build1 (LABEL_EXPR, void_type_node, lab_false2);
2280 gimplify_and_add (t, pre_p);
2282 t = build2 (MODIFY_EXPR, void_type_node, array, stk);
2283 gimplify_and_add (t, pre_p);
2285 if (lab_over)
2287 t = build1 (LABEL_EXPR, void_type_node, lab_over);
2288 gimplify_and_add (t, pre_p);
2292 /* Given the base array pointer (__array) and index to the subsequent
2293 argument (__va_ndx), find the address:
2295 __array + (AP).__va_ndx - (BYTES_BIG_ENDIAN && sizeof (TYPE) < 4
2296 ? sizeof (TYPE)
2297 : __va_size (TYPE))
2299 The results are endian-dependent because values smaller than one word
2300 are aligned differently. */
2303 if (BYTES_BIG_ENDIAN && TREE_CODE (type_size) == INTEGER_CST)
2305 t = size_int (PARM_BOUNDARY / BITS_PER_UNIT);
2306 t = fold_build2 (GE_EXPR, boolean_type_node, type_size, t);
2307 t = fold_build3 (COND_EXPR, sizetype, t, va_size, type_size);
2308 size = t;
2310 else
2311 size = va_size;
2313 t = fold_convert (ptr_type_node, ndx);
2314 addr = build2 (PLUS_EXPR, ptr_type_node, array, t);
2315 t = fold_convert (ptr_type_node, size);
2316 addr = build2 (MINUS_EXPR, ptr_type_node, addr, t);
2318 addr = fold_convert (build_pointer_type (type), addr);
2319 if (indirect)
2320 addr = build_va_arg_indirect_ref (addr);
2321 return build_va_arg_indirect_ref (addr);
2325 enum reg_class
2326 xtensa_preferred_reload_class (rtx x, enum reg_class class, int isoutput)
2328 if (!isoutput && CONSTANT_P (x) && GET_CODE (x) == CONST_DOUBLE)
2329 return NO_REGS;
2331 /* Don't use the stack pointer or hard frame pointer for reloads!
2332 The hard frame pointer would normally be OK except that it may
2333 briefly hold an incoming argument in the prologue, and reload
2334 won't know that it is live because the hard frame pointer is
2335 treated specially. */
2337 if (class == AR_REGS || class == GR_REGS)
2338 return RL_REGS;
2340 return class;
2344 enum reg_class
2345 xtensa_secondary_reload_class (enum reg_class class,
2346 enum machine_mode mode ATTRIBUTE_UNUSED,
2347 rtx x, int isoutput)
2349 int regno;
2351 if (GET_CODE (x) == SIGN_EXTEND)
2352 x = XEXP (x, 0);
2353 regno = xt_true_regnum (x);
2355 if (!isoutput)
2357 if (class == FP_REGS && constantpool_mem_p (x))
2358 return RL_REGS;
2361 if (ACC_REG_P (regno))
2362 return ((class == GR_REGS || class == RL_REGS) ? NO_REGS : RL_REGS);
2363 if (class == ACC_REG)
2364 return (GP_REG_P (regno) ? NO_REGS : RL_REGS);
2366 return NO_REGS;
2370 void
2371 order_regs_for_local_alloc (void)
2373 if (!leaf_function_p ())
2375 memcpy (reg_alloc_order, reg_nonleaf_alloc_order,
2376 FIRST_PSEUDO_REGISTER * sizeof (int));
2378 else
2380 int i, num_arg_regs;
2381 int nxt = 0;
2383 /* Use the AR registers in increasing order (skipping a0 and a1)
2384 but save the incoming argument registers for a last resort. */
2385 num_arg_regs = current_function_args_info.arg_words;
2386 if (num_arg_regs > MAX_ARGS_IN_REGISTERS)
2387 num_arg_regs = MAX_ARGS_IN_REGISTERS;
2388 for (i = GP_ARG_FIRST; i < 16 - num_arg_regs; i++)
2389 reg_alloc_order[nxt++] = i + num_arg_regs;
2390 for (i = 0; i < num_arg_regs; i++)
2391 reg_alloc_order[nxt++] = GP_ARG_FIRST + i;
2393 /* List the coprocessor registers in order. */
2394 for (i = 0; i < BR_REG_NUM; i++)
2395 reg_alloc_order[nxt++] = BR_REG_FIRST + i;
2397 /* List the FP registers in order for now. */
2398 for (i = 0; i < 16; i++)
2399 reg_alloc_order[nxt++] = FP_REG_FIRST + i;
2401 /* GCC requires that we list *all* the registers.... */
2402 reg_alloc_order[nxt++] = 0; /* a0 = return address */
2403 reg_alloc_order[nxt++] = 1; /* a1 = stack pointer */
2404 reg_alloc_order[nxt++] = 16; /* pseudo frame pointer */
2405 reg_alloc_order[nxt++] = 17; /* pseudo arg pointer */
2407 reg_alloc_order[nxt++] = ACC_REG_FIRST; /* MAC16 accumulator */
2412 /* Some Xtensa targets support multiple bss sections. If the section
2413 name ends with ".bss", add SECTION_BSS to the flags. */
2415 static unsigned int
2416 xtensa_multibss_section_type_flags (tree decl, const char *name, int reloc)
2418 unsigned int flags = default_section_type_flags (decl, name, reloc);
2419 const char *suffix;
2421 suffix = strrchr (name, '.');
2422 if (suffix && strcmp (suffix, ".bss") == 0)
2424 if (!decl || (TREE_CODE (decl) == VAR_DECL
2425 && DECL_INITIAL (decl) == NULL_TREE))
2426 flags |= SECTION_BSS; /* @nobits */
2427 else
2428 warning (0, "only uninitialized variables can be placed in a "
2429 ".bss section");
2432 return flags;
2436 /* The literal pool stays with the function. */
2438 static section *
2439 xtensa_select_rtx_section (enum machine_mode mode ATTRIBUTE_UNUSED,
2440 rtx x ATTRIBUTE_UNUSED,
2441 unsigned HOST_WIDE_INT align ATTRIBUTE_UNUSED)
2443 return function_section (current_function_decl);
2447 /* Compute a (partial) cost for rtx X. Return true if the complete
2448 cost has been computed, and false if subexpressions should be
2449 scanned. In either case, *TOTAL contains the cost result. */
2451 static bool
2452 xtensa_rtx_costs (rtx x, int code, int outer_code, int *total)
2454 switch (code)
2456 case CONST_INT:
2457 switch (outer_code)
2459 case SET:
2460 if (xtensa_simm12b (INTVAL (x)))
2462 *total = 4;
2463 return true;
2465 break;
2466 case PLUS:
2467 if (xtensa_simm8 (INTVAL (x))
2468 || xtensa_simm8x256 (INTVAL (x)))
2470 *total = 0;
2471 return true;
2473 break;
2474 case AND:
2475 if (xtensa_mask_immediate (INTVAL (x)))
2477 *total = 0;
2478 return true;
2480 break;
2481 case COMPARE:
2482 if ((INTVAL (x) == 0) || xtensa_b4const (INTVAL (x)))
2484 *total = 0;
2485 return true;
2487 break;
2488 case ASHIFT:
2489 case ASHIFTRT:
2490 case LSHIFTRT:
2491 case ROTATE:
2492 case ROTATERT:
2493 /* No way to tell if X is the 2nd operand so be conservative. */
2494 default: break;
2496 if (xtensa_simm12b (INTVAL (x)))
2497 *total = 5;
2498 else if (TARGET_CONST16)
2499 *total = COSTS_N_INSNS (2);
2500 else
2501 *total = 6;
2502 return true;
2504 case CONST:
2505 case LABEL_REF:
2506 case SYMBOL_REF:
2507 if (TARGET_CONST16)
2508 *total = COSTS_N_INSNS (2);
2509 else
2510 *total = 5;
2511 return true;
2513 case CONST_DOUBLE:
2514 if (TARGET_CONST16)
2515 *total = COSTS_N_INSNS (4);
2516 else
2517 *total = 7;
2518 return true;
2520 case MEM:
2522 int num_words =
2523 (GET_MODE_SIZE (GET_MODE (x)) > UNITS_PER_WORD) ? 2 : 1;
2525 if (memory_address_p (GET_MODE (x), XEXP ((x), 0)))
2526 *total = COSTS_N_INSNS (num_words);
2527 else
2528 *total = COSTS_N_INSNS (2*num_words);
2529 return true;
2532 case FFS:
2533 *total = COSTS_N_INSNS (TARGET_NSA ? 5 : 50);
2534 return true;
2536 case NOT:
2537 *total = COSTS_N_INSNS ((GET_MODE (x) == DImode) ? 3 : 2);
2538 return true;
2540 case AND:
2541 case IOR:
2542 case XOR:
2543 if (GET_MODE (x) == DImode)
2544 *total = COSTS_N_INSNS (2);
2545 else
2546 *total = COSTS_N_INSNS (1);
2547 return true;
2549 case ASHIFT:
2550 case ASHIFTRT:
2551 case LSHIFTRT:
2552 if (GET_MODE (x) == DImode)
2553 *total = COSTS_N_INSNS (50);
2554 else
2555 *total = COSTS_N_INSNS (1);
2556 return true;
2558 case ABS:
2560 enum machine_mode xmode = GET_MODE (x);
2561 if (xmode == SFmode)
2562 *total = COSTS_N_INSNS (TARGET_HARD_FLOAT ? 1 : 50);
2563 else if (xmode == DFmode)
2564 *total = COSTS_N_INSNS (50);
2565 else
2566 *total = COSTS_N_INSNS (4);
2567 return true;
2570 case PLUS:
2571 case MINUS:
2573 enum machine_mode xmode = GET_MODE (x);
2574 if (xmode == SFmode)
2575 *total = COSTS_N_INSNS (TARGET_HARD_FLOAT ? 1 : 50);
2576 else if (xmode == DFmode || xmode == DImode)
2577 *total = COSTS_N_INSNS (50);
2578 else
2579 *total = COSTS_N_INSNS (1);
2580 return true;
2583 case NEG:
2584 *total = COSTS_N_INSNS ((GET_MODE (x) == DImode) ? 4 : 2);
2585 return true;
2587 case MULT:
2589 enum machine_mode xmode = GET_MODE (x);
2590 if (xmode == SFmode)
2591 *total = COSTS_N_INSNS (TARGET_HARD_FLOAT ? 4 : 50);
2592 else if (xmode == DFmode || xmode == DImode)
2593 *total = COSTS_N_INSNS (50);
2594 else if (TARGET_MUL32)
2595 *total = COSTS_N_INSNS (4);
2596 else if (TARGET_MAC16)
2597 *total = COSTS_N_INSNS (16);
2598 else if (TARGET_MUL16)
2599 *total = COSTS_N_INSNS (12);
2600 else
2601 *total = COSTS_N_INSNS (50);
2602 return true;
2605 case DIV:
2606 case MOD:
2608 enum machine_mode xmode = GET_MODE (x);
2609 if (xmode == SFmode)
2611 *total = COSTS_N_INSNS (TARGET_HARD_FLOAT_DIV ? 8 : 50);
2612 return true;
2614 else if (xmode == DFmode)
2616 *total = COSTS_N_INSNS (50);
2617 return true;
2620 /* Fall through. */
2622 case UDIV:
2623 case UMOD:
2625 enum machine_mode xmode = GET_MODE (x);
2626 if (xmode == DImode)
2627 *total = COSTS_N_INSNS (50);
2628 else if (TARGET_DIV32)
2629 *total = COSTS_N_INSNS (32);
2630 else
2631 *total = COSTS_N_INSNS (50);
2632 return true;
2635 case SQRT:
2636 if (GET_MODE (x) == SFmode)
2637 *total = COSTS_N_INSNS (TARGET_HARD_FLOAT_SQRT ? 8 : 50);
2638 else
2639 *total = COSTS_N_INSNS (50);
2640 return true;
2642 case SMIN:
2643 case UMIN:
2644 case SMAX:
2645 case UMAX:
2646 *total = COSTS_N_INSNS (TARGET_MINMAX ? 1 : 50);
2647 return true;
2649 case SIGN_EXTRACT:
2650 case SIGN_EXTEND:
2651 *total = COSTS_N_INSNS (TARGET_SEXT ? 1 : 2);
2652 return true;
2654 case ZERO_EXTRACT:
2655 case ZERO_EXTEND:
2656 *total = COSTS_N_INSNS (1);
2657 return true;
2659 default:
2660 return false;
2664 /* Worker function for TARGET_RETURN_IN_MEMORY. */
2666 static bool
2667 xtensa_return_in_memory (tree type, tree fntype ATTRIBUTE_UNUSED)
2669 return ((unsigned HOST_WIDE_INT) int_size_in_bytes (type)
2670 > 4 * UNITS_PER_WORD);
2673 #include "gt-xtensa.h"