gcc/config/sparc/sparc.c

   1 /* Subroutines for insn-output.c for Sun SPARC.
   2    Copyright (C) 1987, 88, 89, 92-97, 1998 Free Software Foundation, Inc.
   3    Contributed by Michael Tiemann (tiemann@cygnus.com)
   4    64 bit SPARC V9 support by Michael Tiemann, Jim Wilson, and Doug Evans,
   5    at Cygnus Support.
   6
   7 This file is part of GNU CC.
   8
   9 GNU CC is free software; you can redistribute it and/or modify
  10 it under the terms of the GNU General Public License as published by
  11 the Free Software Foundation; either version 2, or (at your option)
  12 any later version.
  13
  14 GNU CC is distributed in the hope that it will be useful,
  15 but WITHOUT ANY WARRANTY; without even the implied warranty of
  16 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  17 GNU General Public License for more details.
  18
  19 You should have received a copy of the GNU General Public License
  20 along with GNU CC; see the file COPYING.  If not, write to
  21 the Free Software Foundation, 59 Temple Place - Suite 330,
  22 Boston, MA 02111-1307, USA.  */
  23
  24 #include "config.h"
  25 #include <stdio.h>
  26 #include "tree.h"
  27 #include "rtl.h"
  28 #include "regs.h"
  29 #include "hard-reg-set.h"
  30 #include "real.h"
  31 #include "insn-config.h"
  32 #include "conditions.h"
  33 #include "insn-flags.h"
  34 #include "output.h"
  35 #include "insn-attr.h"
  36 #include "flags.h"
  37 #include "expr.h"
  38 #include "recog.h"
  39
  40 /* 1 if the caller has placed an "unimp" insn immediately after the call.
  41    This is used in v8 code when calling a function that returns a structure.
  42    v9 doesn't have this.  Be careful to have this test be the same as that
  43    used on the call.  */
  44
  45 #define SKIP_CALLERS_UNIMP_P  \
  46 (!TARGET_ARCH64 && current_function_returns_struct                      \
  47  && ! integer_zerop (DECL_SIZE (DECL_RESULT (current_function_decl)))   \
  48  && (TREE_CODE (DECL_SIZE (DECL_RESULT (current_function_decl)))        \
  49      == INTEGER_CST))
  50
  51 /* Global variables for machine-dependent things.  */
  52
  53 /* Size of frame.  Need to know this to emit return insns from leaf procedures.
  54    ACTUAL_FSIZE is set by compute_frame_size() which is called during the
  55    reload pass.  This is important as the value is later used in insn
  56    scheduling (to see what can go in a delay slot).
  57    APPARENT_FSIZE is the size of the stack less the register save area and less
  58    the outgoing argument area.  It is used when saving call preserved regs.  */
  59 static int apparent_fsize;
  60 static int actual_fsize;
  61
  62 /* Save the operands last given to a compare for use when we
  63    generate a scc or bcc insn.  */
  64
  65 rtx sparc_compare_op0, sparc_compare_op1;
  66
  67 /* We may need an epilogue if we spill too many registers.
  68    If this is non-zero, then we branch here for the epilogue.  */
  69 static rtx leaf_label;
  70
  71 #ifdef LEAF_REGISTERS
  72
  73 /* Vector to say how input registers are mapped to output
  74    registers.  FRAME_POINTER_REGNUM cannot be remapped by
  75    this function to eliminate it.  You must use -fomit-frame-pointer
  76    to get that.  */
  77 char leaf_reg_remap[] =
  78 { 0, 1, 2, 3, 4, 5, 6, 7,
  79   -1, -1, -1, -1, -1, -1, 14, -1,
  80   -1, -1, -1, -1, -1, -1, -1, -1,
  81   8, 9, 10, 11, 12, 13, -1, 15,
  82
  83   32, 33, 34, 35, 36, 37, 38, 39,
  84   40, 41, 42, 43, 44, 45, 46, 47,
  85   48, 49, 50, 51, 52, 53, 54, 55,
  86   56, 57, 58, 59, 60, 61, 62, 63,
  87   64, 65, 66, 67, 68, 69, 70, 71,
  88   72, 73, 74, 75, 76, 77, 78, 79,
  89   80, 81, 82, 83, 84, 85, 86, 87,
  90   88, 89, 90, 91, 92, 93, 94, 95,
  91   96, 97, 98, 99, 100};
  92
  93 #endif
  94
  95 /* Name of where we pretend to think the frame pointer points.
  96    Normally, this is "%fp", but if we are in a leaf procedure,
  97    this is "%sp+something".  We record "something" separately as it may be
  98    too big for reg+constant addressing.  */
  99
 100 static char *frame_base_name;
 101 static int frame_base_offset;
 102
 103 static rtx pic_setup_code       PROTO((void));
 104 static rtx find_addr_reg        PROTO((rtx));
 105 static void sparc_init_modes    PROTO((void));
 106 static int save_regs            PROTO((FILE *, int, int, char *,
 107                                        int, int, int));
 108 static int restore_regs         PROTO((FILE *, int, int, char *, int, int));
 109 static void build_big_number    PROTO((FILE *, int, char *));
 110 static function_arg_slotno      PROTO((const CUMULATIVE_ARGS *,
 111                                        enum machine_mode, tree, int, int,
 112                                        int *, int *));
 113
 114 #ifdef DWARF2_DEBUGGING_INFO
 115 extern char *dwarf2out_cfi_label ();
 116 #endif
 117 \f
 118 /* Option handling.  */
 119
 120 /* Code model option as passed by user.  */
 121 char *sparc_cmodel_string;
 122 /* Parsed value.  */
 123 enum cmodel sparc_cmodel;
 124
 125 /* Record alignment options as passed by user.  */
 126 char *sparc_align_loops_string;
 127 char *sparc_align_jumps_string;
 128 char *sparc_align_funcs_string;
 129
 130 /* Parsed values, as a power of two.  */
 131 int sparc_align_loops;
 132 int sparc_align_jumps;
 133 int sparc_align_funcs;
 134
 135 struct sparc_cpu_select sparc_select[] =
 136 {
 137   /* switch     name,           tune    arch */
 138   { (char *)0,  "default",      1,      1 },
 139   { (char *)0,  "-mcpu=",       1,      1 },
 140   { (char *)0,  "-mtune=",      1,      0 },
 141   { 0, 0 }
 142 };
 143
 144 /* CPU type.  This is set from TARGET_CPU_DEFAULT and -m{cpu,tune}=xxx.  */
 145 enum processor_type sparc_cpu;
 146
 147 /* Validate and override various options, and do some machine dependent
 148    initialization.  */
 149
 150 void
 151 sparc_override_options ()
 152 {
 153   static struct code_model {
 154     char *name;
 155     int value;
 156   } cmodels[] = {
 157     { "32", CM_32 },
 158     { "medlow", CM_MEDLOW },
 159     { "medmid", CM_MEDMID },
 160     { "medany", CM_MEDANY },
 161     { "embmedany", CM_EMBMEDANY },
 162     { 0, 0 }
 163   };
 164   struct code_model *cmodel;
 165   /* Map TARGET_CPU_DEFAULT to value for -m{arch,tune}=.  */
 166   static struct cpu_default {
 167     int cpu;
 168     char *name;
 169   } cpu_default[] = {
 170     /* There must be one entry here for each TARGET_CPU value.  */
 171     { TARGET_CPU_sparc, "cypress" },
 172     { TARGET_CPU_sparclet, "tsc701" },
 173     { TARGET_CPU_sparclite, "f930" },
 174     { TARGET_CPU_v8, "v8" },
 175     { TARGET_CPU_supersparc, "supersparc" },
 176     { TARGET_CPU_v9, "v9" },
 177     { TARGET_CPU_ultrasparc, "ultrasparc" },
 178     { 0 }
 179   };
 180   struct cpu_default *def;
 181   /* Table of values for -m{cpu,tune}=.  */
 182   static struct cpu_table {
 183     char *name;
 184     enum processor_type processor;
 185     int disable;
 186     int enable;
 187   } cpu_table[] = {
 188     { "v7",         PROCESSOR_V7, MASK_ISA, 0 },
 189     { "cypress",    PROCESSOR_CYPRESS, MASK_ISA, 0 },
 190     { "v8",         PROCESSOR_V8, MASK_ISA, MASK_V8 },
 191     /* TI TMS390Z55 supersparc */
 192     { "supersparc", PROCESSOR_SUPERSPARC, MASK_ISA, MASK_V8 },
 193     { "sparclite",  PROCESSOR_SPARCLITE, MASK_ISA, MASK_SPARCLITE },
 194     /* The Fujitsu MB86930 is the original sparclite chip, with no fpu.
 195        The Fujitsu MB86934 is the recent sparclite chip, with an fpu.  */
 196     { "f930",       PROCESSOR_F930, MASK_ISA|MASK_FPU, MASK_SPARCLITE },
 197     { "f934",       PROCESSOR_F934, MASK_ISA, MASK_SPARCLITE|MASK_FPU },
 198     { "sparclet",   PROCESSOR_SPARCLET, MASK_ISA, MASK_SPARCLET },
 199     /* TEMIC sparclet */
 200     { "tsc701",     PROCESSOR_TSC701, MASK_ISA, MASK_SPARCLET },
 201     /* "v8plus" is what Sun calls Solaris2.5 running on UltraSPARC's.  */
 202     { "v8plus",     PROCESSOR_V8PLUS, MASK_ISA, MASK_V9 },
 203     { "v9",         PROCESSOR_V9, MASK_ISA, MASK_V9 },
 204     /* TI ultrasparc */
 205     { "ultrasparc", PROCESSOR_ULTRASPARC, MASK_ISA, MASK_V9 },
 206     { 0 }
 207   };
 208   struct cpu_table *cpu;
 209   struct sparc_cpu_select *sel;
 210   int fpu;
 211
 212 #ifndef SPARC_BI_ARCH
 213   /* Check for unsupported architecture size.  */
 214   if (! TARGET_64BIT != DEFAULT_ARCH32_P)
 215     {
 216       error ("%s is not supported by this configuration",
 217              DEFAULT_ARCH32_P ? "-m64" : "-m32");
 218     }
 219 #endif
 220
 221   /* Code model selection.  */
 222   sparc_cmodel = SPARC_DEFAULT_CMODEL;
 223   if (sparc_cmodel_string != NULL)
 224     {
 225       if (TARGET_ARCH64)
 226         {
 227           for (cmodel = &cmodels[0]; cmodel->name; cmodel++)
 228             if (strcmp (sparc_cmodel_string, cmodel->name) == 0)
 229               break;
 230           if (cmodel->name == NULL)
 231             error ("bad value (%s) for -mcmodel= switch", sparc_cmodel_string);
 232           else
 233             sparc_cmodel = cmodel->value;
 234         }
 235       else
 236         error ("-mcmodel= is not supported on 32 bit systems");
 237     }
 238
 239   fpu = TARGET_FPU; /* save current -mfpu status */
 240
 241   /* Set the default CPU.  */
 242   for (def = &cpu_default[0]; def->name; ++def)
 243     if (def->cpu == TARGET_CPU_DEFAULT)
 244       break;
 245   if (! def->name)
 246     abort ();
 247   sparc_select[0].string = def->name;
 248
 249   for (sel = &sparc_select[0]; sel->name; ++sel)
 250     {
 251       if (sel->string)
 252         {
 253           for (cpu = &cpu_table[0]; cpu->name; ++cpu)
 254             if (! strcmp (sel->string, cpu->name))
 255               {
 256                 if (sel->set_tune_p)
 257                   sparc_cpu = cpu->processor;
 258
 259                 if (sel->set_arch_p)
 260                   {
 261                     target_flags &= ~cpu->disable;
 262                     target_flags |= cpu->enable;
 263                   }
 264                 break;
 265               }
 266
 267           if (! cpu->name)
 268             error ("bad value (%s) for %s switch", sel->string, sel->name);
 269         }
 270     }
 271
 272   /* If -mfpu or -mno-fpu was explicitly used, don't override with
 273      the processor default.  */
 274   if (TARGET_FPU_SET)
 275     target_flags = (target_flags & ~MASK_FPU) | fpu;
 276
 277   /* Use the deprecated v8 insns for sparc64 in 32 bit mode.  */
 278   if (TARGET_V9 && TARGET_ARCH32)
 279     target_flags |= MASK_DEPRECATED_V8_INSNS;
 280
 281   /* Validate -malign-loops= value, or provide default.  */
 282   if (sparc_align_loops_string)
 283     {
 284       sparc_align_loops = exact_log2 (atoi (sparc_align_loops_string));
 285       if (sparc_align_loops < 2 || sparc_align_loops > 7)
 286         fatal ("-malign-loops=%s is not between 4 and 128 or is not a power of two",
 287                sparc_align_loops_string);
 288     }
 289   else
 290     {
 291       /* ??? This relies on ASM_OUTPUT_ALIGN to not emit the alignment if
 292          its 0.  This sounds a bit kludgey.  */
 293       sparc_align_loops = 0;
 294     }
 295
 296   /* Validate -malign-jumps= value, or provide default.  */
 297   if (sparc_align_jumps_string)
 298     {
 299       sparc_align_jumps = exact_log2 (atoi (sparc_align_jumps_string));
 300       if (sparc_align_jumps < 2 || sparc_align_loops > 7)
 301         fatal ("-malign-jumps=%s is not between 4 and 128 or is not a power of two",
 302                sparc_align_jumps_string);
 303     }
 304   else
 305     {
 306       /* ??? This relies on ASM_OUTPUT_ALIGN to not emit the alignment if
 307          its 0.  This sounds a bit kludgey.  */
 308       sparc_align_jumps = 0;
 309     }
 310
 311   /* Validate -malign-functions= value, or provide default. */
 312   if (sparc_align_funcs_string)
 313     {
 314       sparc_align_funcs = exact_log2 (atoi (sparc_align_funcs_string));
 315       if (sparc_align_funcs < 2 || sparc_align_loops > 7)
 316         fatal ("-malign-functions=%s is not between 4 and 128 or is not a power of two",
 317                sparc_align_funcs_string);
 318     }
 319   else
 320     sparc_align_funcs = DEFAULT_SPARC_ALIGN_FUNCS;
 321
 322   /* Do various machine dependent initializations.  */
 323   sparc_init_modes ();
 324 }
 325 \f
 326 /* Float conversions (v9 only).
 327
 328    The floating point registers cannot hold DImode values because SUBREG's
 329    on them get the wrong register.   "(subreg:SI (reg:DI M int-reg) 0)" is the
 330    same as "(subreg:SI (reg:DI N float-reg) 1)", but gcc doesn't know how to
 331    turn the "0" to a "1".  Therefore, we must explicitly do the conversions
 332    to/from int/fp regs.  `sparc64_fpconv_stack_slot' is the address of an
 333    8 byte stack slot used during the transfer.
 334    ??? I could have used [%fp-16] but I didn't want to add yet another
 335    dependence on this.  */
 336 /* ??? Can we use assign_stack_temp here?  */
 337
 338 static rtx fpconv_stack_temp;
 339
 340 /* Called once for each function.  */
 341
 342 void
 343 sparc_init_expanders ()
 344 {
 345   fpconv_stack_temp = NULL_RTX;
 346 }
 347
 348 /* Assign a stack temp for fp/int DImode conversions.  */
 349
 350 rtx
 351 sparc64_fpconv_stack_temp ()
 352 {
 353   if (fpconv_stack_temp == NULL_RTX)
 354     fpconv_stack_temp =
 355       assign_stack_local (DImode, GET_MODE_SIZE (DImode), 0);
 356
 357   return fpconv_stack_temp;
 358 }
 359 \f
 360 /* Miscellaneous utilities.  */
 361
 362 /* Nonzero if CODE, a comparison, is suitable for use in v9 conditional move
 363    or branch on register contents instructions.  */
 364
 365 int
 366 v9_regcmp_p (code)
 367      enum rtx_code code;
 368 {
 369   return (code == EQ || code == NE || code == GE || code == LT
 370           || code == LE || code == GT);
 371 }
 372 \f
 373 /* Operand constraints.  */
 374
 375 /* Return non-zero only if OP is a register of mode MODE,
 376    or const0_rtx.  Don't allow const0_rtx if TARGET_LIVE_G0 because
 377    %g0 may contain anything.  */
 378
 379 int
 380 reg_or_0_operand (op, mode)
 381      rtx op;
 382      enum machine_mode mode;
 383 {
 384   if (register_operand (op, mode))
 385     return 1;
 386   if (TARGET_LIVE_G0)
 387     return 0;
 388   if (op == const0_rtx)
 389     return 1;
 390   if (GET_MODE (op) == VOIDmode && GET_CODE (op) == CONST_DOUBLE
 391       && CONST_DOUBLE_HIGH (op) == 0
 392       && CONST_DOUBLE_LOW (op) == 0)
 393     return 1;
 394   if (GET_MODE_CLASS (GET_MODE (op)) == MODE_FLOAT
 395       && GET_CODE (op) == CONST_DOUBLE
 396       && fp_zero_operand (op))
 397     return 1;
 398   return 0;
 399 }
 400
 401 /* Nonzero if OP is a floating point value with value 0.0.  */
 402
 403 int
 404 fp_zero_operand (op)
 405      rtx op;
 406 {
 407   REAL_VALUE_TYPE r;
 408
 409   REAL_VALUE_FROM_CONST_DOUBLE (r, op);
 410   return (REAL_VALUES_EQUAL (r, dconst0) && ! REAL_VALUE_MINUS_ZERO (r));
 411 }
 412
 413 /* Nonzero if OP is an integer register.  */
 414
 415 int
 416 intreg_operand (op, mode)
 417      rtx op;
 418      enum machine_mode mode;
 419 {
 420   return (register_operand (op, SImode)
 421           || (TARGET_ARCH64 && register_operand (op, DImode)));
 422 }
 423
 424 /* Nonzero if OP is a floating point condition code register.  */
 425
 426 int
 427 fcc_reg_operand (op, mode)
 428      rtx op;
 429      enum machine_mode mode;
 430 {
 431   /* This can happen when recog is called from combine.  Op may be a MEM.
 432      Fail instead of calling abort in this case.  */
 433   if (GET_CODE (op) != REG)
 434     return 0;
 435
 436   if (mode != VOIDmode && mode != GET_MODE (op))
 437     return 0;
 438   if (mode == VOIDmode
 439       && (GET_MODE (op) != CCFPmode && GET_MODE (op) != CCFPEmode))
 440     return 0;
 441
 442 #if 0   /* ??? ==> 1 when %fcc0-3 are pseudos first.  See gen_compare_reg().  */
 443   if (reg_renumber == 0)
 444     return REGNO (op) >= FIRST_PSEUDO_REGISTER;
 445   return REGNO_OK_FOR_CCFP_P (REGNO (op));
 446 #else
 447   return (unsigned) REGNO (op) - SPARC_FIRST_V9_FCC_REG < 4;
 448 #endif
 449 }
 450
 451 /* Nonzero if OP is an integer or floating point condition code register.  */
 452
 453 int
 454 icc_or_fcc_reg_operand (op, mode)
 455      rtx op;
 456      enum machine_mode mode;
 457 {
 458   if (GET_CODE (op) == REG && REGNO (op) == SPARC_ICC_REG)
 459     {
 460       if (mode != VOIDmode && mode != GET_MODE (op))
 461         return 0;
 462       if (mode == VOIDmode
 463           && GET_MODE (op) != CCmode && GET_MODE (op) != CCXmode)
 464         return 0;
 465       return 1;
 466     }
 467
 468   return fcc_reg_operand (op, mode);
 469 }
 470
 471 /* Nonzero if OP can appear as the dest of a RESTORE insn.  */
 472 int
 473 restore_operand (op, mode)
 474      rtx op;
 475      enum machine_mode mode;
 476 {
 477   return (GET_CODE (op) == REG && GET_MODE (op) == mode
 478           && (REGNO (op) < 8 || (REGNO (op) >= 24 && REGNO (op) < 32)));
 479 }
 480
 481 /* Call insn on SPARC can take a PC-relative constant address, or any regular
 482    memory address.  */
 483
 484 int
 485 call_operand (op, mode)
 486      rtx op;
 487      enum machine_mode mode;
 488 {
 489   if (GET_CODE (op) != MEM)
 490     abort ();
 491   op = XEXP (op, 0);
 492   return (symbolic_operand (op, mode) || memory_address_p (Pmode, op));
 493 }
 494
 495 int
 496 call_operand_address (op, mode)
 497      rtx op;
 498      enum machine_mode mode;
 499 {
 500   return (symbolic_operand (op, mode) || memory_address_p (Pmode, op));
 501 }
 502
 503 /* Returns 1 if OP is either a symbol reference or a sum of a symbol
 504    reference and a constant.  */
 505
 506 int
 507 symbolic_operand (op, mode)
 508      register rtx op;
 509      enum machine_mode mode;
 510 {
 511   switch (GET_CODE (op))
 512     {
 513     case SYMBOL_REF:
 514     case LABEL_REF:
 515       return 1;
 516
 517     case CONST:
 518       op = XEXP (op, 0);
 519       return ((GET_CODE (XEXP (op, 0)) == SYMBOL_REF
 520                || GET_CODE (XEXP (op, 0)) == LABEL_REF)
 521               && GET_CODE (XEXP (op, 1)) == CONST_INT);
 522
 523       /* ??? This clause seems to be irrelevant.  */
 524     case CONST_DOUBLE:
 525       return GET_MODE (op) == mode;
 526
 527     default:
 528       return 0;
 529     }
 530 }
 531
 532 /* Return truth value of statement that OP is a symbolic memory
 533    operand of mode MODE.  */
 534
 535 int
 536 symbolic_memory_operand (op, mode)
 537      rtx op;
 538      enum machine_mode mode;
 539 {
 540   if (GET_CODE (op) == SUBREG)
 541     op = SUBREG_REG (op);
 542   if (GET_CODE (op) != MEM)
 543     return 0;
 544   op = XEXP (op, 0);
 545   return (GET_CODE (op) == SYMBOL_REF || GET_CODE (op) == CONST
 546           || GET_CODE (op) == HIGH || GET_CODE (op) == LABEL_REF);
 547 }
 548
 549 /* Return truth value of statement that OP is a LABEL_REF of mode MODE.  */
 550
 551 int
 552 label_ref_operand (op, mode)
 553      rtx op;
 554      enum machine_mode mode;
 555 {
 556   if (GET_CODE (op) != LABEL_REF)
 557     return 0;
 558   if (GET_MODE (op) != mode)
 559     return 0;
 560   return 1;
 561 }
 562
 563 /* Return 1 if the operand is an argument used in generating pic references
 564    in either the medium/low or medium/anywhere code models of sparc64.  */
 565
 566 int
 567 sp64_medium_pic_operand (op, mode)
 568      rtx op;
 569      enum machine_mode mode;
 570 {
 571   /* Check for (const (minus (symbol_ref:GOT)
 572                              (const (minus (label) (pc))))).  */
 573   if (GET_CODE (op) != CONST)
 574     return 0;
 575   op = XEXP (op, 0);
 576   if (GET_CODE (op) != MINUS)
 577     return 0;
 578   if (GET_CODE (XEXP (op, 0)) != SYMBOL_REF)
 579     return 0;
 580   /* ??? Ensure symbol is GOT.  */
 581   if (GET_CODE (XEXP (op, 1)) != CONST)
 582     return 0;
 583   if (GET_CODE (XEXP (XEXP (op, 1), 0)) != MINUS)
 584     return 0;
 585   return 1;
 586 }
 587
 588 /* Return 1 if the operand is a data segment reference.  This includes
 589    the readonly data segment, or in other words anything but the text segment.
 590    This is needed in the medium/anywhere code model on v9.  These values
 591    are accessed with EMBMEDANY_BASE_REG.  */
 592
 593 int
 594 data_segment_operand (op, mode)
 595      rtx op;
 596      enum machine_mode mode;
 597 {
 598   switch (GET_CODE (op))
 599     {
 600     case SYMBOL_REF :
 601       return ! SYMBOL_REF_FLAG (op);
 602     case PLUS :
 603       /* Assume canonical format of symbol + constant.
 604          Fall through.  */
 605     case CONST :
 606       return data_segment_operand (XEXP (op, 0));
 607     default :
 608       return 0;
 609     }
 610 }
 611
 612 /* Return 1 if the operand is a text segment reference.
 613    This is needed in the medium/anywhere code model on v9.  */
 614
 615 int
 616 text_segment_operand (op, mode)
 617      rtx op;
 618      enum machine_mode mode;
 619 {
 620   switch (GET_CODE (op))
 621     {
 622     case LABEL_REF :
 623       return 1;
 624     case SYMBOL_REF :
 625       return SYMBOL_REF_FLAG (op);
 626     case PLUS :
 627       /* Assume canonical format of symbol + constant.
 628          Fall through.  */
 629     case CONST :
 630       return text_segment_operand (XEXP (op, 0));
 631     default :
 632       return 0;
 633     }
 634 }
 635
 636 /* Return 1 if the operand is either a register or a memory operand that is
 637    not symbolic.  */
 638
 639 int
 640 reg_or_nonsymb_mem_operand (op, mode)
 641     register rtx op;
 642     enum machine_mode mode;
 643 {
 644   if (register_operand (op, mode))
 645     return 1;
 646
 647   if (memory_operand (op, mode) && ! symbolic_memory_operand (op, mode))
 648     return 1;
 649
 650   return 0;
 651 }
 652
 653 int
 654 sparc_operand (op, mode)
 655      rtx op;
 656      enum machine_mode mode;
 657 {
 658   if (register_operand (op, mode))
 659     return 1;
 660   if (GET_CODE (op) == CONST_INT)
 661     return SMALL_INT (op);
 662   if (GET_MODE (op) != mode)
 663     return 0;
 664   if (GET_CODE (op) == SUBREG)
 665     op = SUBREG_REG (op);
 666   if (GET_CODE (op) != MEM)
 667     return 0;
 668
 669   op = XEXP (op, 0);
 670   if (GET_CODE (op) == LO_SUM)
 671     return (GET_CODE (XEXP (op, 0)) == REG
 672             && symbolic_operand (XEXP (op, 1), Pmode));
 673   return memory_address_p (mode, op);
 674 }
 675
 676 int
 677 move_operand (op, mode)
 678      rtx op;
 679      enum machine_mode mode;
 680 {
 681   if (mode == DImode && arith_double_operand (op, mode))
 682     return 1;
 683   if (register_operand (op, mode))
 684     return 1;
 685   if (GET_CODE (op) == CONST_INT)
 686     return SMALL_INT (op) || SPARC_SETHI_P (INTVAL (op));
 687
 688   if (GET_MODE (op) != mode)
 689     return 0;
 690   if (GET_CODE (op) == SUBREG)
 691     op = SUBREG_REG (op);
 692   if (GET_CODE (op) != MEM)
 693     return 0;
 694   op = XEXP (op, 0);
 695   if (GET_CODE (op) == LO_SUM)
 696     return (register_operand (XEXP (op, 0), Pmode)
 697             && CONSTANT_P (XEXP (op, 1)));
 698   return memory_address_p (mode, op);
 699 }
 700
 701 int
 702 splittable_symbolic_memory_operand (op, mode)
 703      rtx op;
 704      enum machine_mode mode;
 705 {
 706   if (GET_CODE (op) != MEM)
 707     return 0;
 708   if (! symbolic_operand (XEXP (op, 0), Pmode))
 709     return 0;
 710   return 1;
 711 }
 712
 713 int
 714 splittable_immediate_memory_operand (op, mode)
 715      rtx op;
 716      enum machine_mode mode;
 717 {
 718   if (GET_CODE (op) != MEM)
 719     return 0;
 720   if (! immediate_operand (XEXP (op, 0), Pmode))
 721     return 0;
 722   return 1;
 723 }
 724
 725 /* Return truth value of whether OP is EQ or NE.  */
 726
 727 int
 728 eq_or_neq (op, mode)
 729      rtx op;
 730      enum machine_mode mode;
 731 {
 732   return (GET_CODE (op) == EQ || GET_CODE (op) == NE);
 733 }
 734
 735 /* Return 1 if this is a comparison operator, but not an EQ, NE, GEU,
 736    or LTU for non-floating-point.  We handle those specially.  */
 737
 738 int
 739 normal_comp_operator (op, mode)
 740      rtx op;
 741      enum machine_mode mode;
 742 {
 743   enum rtx_code code = GET_CODE (op);
 744
 745   if (GET_RTX_CLASS (code) != '<')
 746     return 0;
 747
 748   if (GET_MODE (XEXP (op, 0)) == CCFPmode
 749       || GET_MODE (XEXP (op, 0)) == CCFPEmode)
 750     return 1;
 751
 752   return (code != NE && code != EQ && code != GEU && code != LTU);
 753 }
 754
 755 /* Return 1 if this is a comparison operator.  This allows the use of
 756    MATCH_OPERATOR to recognize all the branch insns.  */
 757
 758 int
 759 noov_compare_op (op, mode)
 760     register rtx op;
 761     enum machine_mode mode;
 762 {
 763   enum rtx_code code = GET_CODE (op);
 764
 765   if (GET_RTX_CLASS (code) != '<')
 766     return 0;
 767
 768   if (GET_MODE (XEXP (op, 0)) == CC_NOOVmode)
 769     /* These are the only branches which work with CC_NOOVmode.  */
 770     return (code == EQ || code == NE || code == GE || code == LT);
 771   return 1;
 772 }
 773
 774 /* Nonzero if OP is a comparison operator suitable for use in v9
 775    conditional move or branch on register contents instructions.  */
 776
 777 int
 778 v9_regcmp_op (op, mode)
 779      register rtx op;
 780      enum machine_mode mode;
 781 {
 782   enum rtx_code code = GET_CODE (op);
 783
 784   if (GET_RTX_CLASS (code) != '<')
 785     return 0;
 786
 787   return v9_regcmp_p (code);
 788 }
 789
 790 /* Return 1 if this is a SIGN_EXTEND or ZERO_EXTEND operation.  */
 791
 792 int
 793 extend_op (op, mode)
 794      rtx op;
 795      enum machine_mode mode;
 796 {
 797   return GET_CODE (op) == SIGN_EXTEND || GET_CODE (op) == ZERO_EXTEND;
 798 }
 799
 800 /* Return nonzero if OP is an operator of mode MODE which can set
 801    the condition codes explicitly.  We do not include PLUS and MINUS
 802    because these require CC_NOOVmode, which we handle explicitly.  */
 803
 804 int
 805 cc_arithop (op, mode)
 806      rtx op;
 807      enum machine_mode mode;
 808 {
 809   if (GET_CODE (op) == AND
 810       || GET_CODE (op) == IOR
 811       || GET_CODE (op) == XOR)
 812     return 1;
 813
 814   return 0;
 815 }
 816
 817 /* Return nonzero if OP is an operator of mode MODE which can bitwise
 818    complement its second operand and set the condition codes explicitly.  */
 819
 820 int
 821 cc_arithopn (op, mode)
 822      rtx op;
 823      enum machine_mode mode;
 824 {
 825   /* XOR is not here because combine canonicalizes (xor (not ...) ...)
 826      and (xor ... (not ...)) to (not (xor ...)).   */
 827   return (GET_CODE (op) == AND
 828           || GET_CODE (op) == IOR);
 829 }
 830 \f
 831 /* Return true if OP is a register, or is a CONST_INT that can fit in a
 832    signed 13 bit immediate field.  This is an acceptable SImode operand for
 833    most 3 address instructions.  */
 834
 835 int
 836 arith_operand (op, mode)
 837      rtx op;
 838      enum machine_mode mode;
 839 {
 840   return (register_operand (op, mode)
 841           || (GET_CODE (op) == CONST_INT && SMALL_INT (op)));
 842 }
 843
 844 /* Return true if OP is a register, or is a CONST_INT that can fit in a
 845    signed 11 bit immediate field.  This is an acceptable SImode operand for
 846    the movcc instructions.  */
 847
 848 int
 849 arith11_operand (op, mode)
 850      rtx op;
 851      enum machine_mode mode;
 852 {
 853   return (register_operand (op, mode)
 854           || (GET_CODE (op) == CONST_INT && SPARC_SIMM11_P (INTVAL (op))));
 855 }
 856
 857 /* Return true if OP is a register, or is a CONST_INT that can fit in a
 858    signed 10 bit immediate field.  This is an acceptable SImode operand for
 859    the movrcc instructions.  */
 860
 861 int
 862 arith10_operand (op, mode)
 863      rtx op;
 864      enum machine_mode mode;
 865 {
 866   return (register_operand (op, mode)
 867           || (GET_CODE (op) == CONST_INT && SPARC_SIMM10_P (INTVAL (op))));
 868 }
 869
 870 /* Return true if OP is a register, is a CONST_INT that fits in a 13 bit
 871    immediate field, or is a CONST_DOUBLE whose both parts fit in a 13 bit
 872    immediate field.
 873    v9: Return true if OP is a register, or is a CONST_INT or CONST_DOUBLE that
 874    can fit in a 13 bit immediate field.  This is an acceptable DImode operand
 875    for most 3 address instructions.  */
 876
 877 int
 878 arith_double_operand (op, mode)
 879      rtx op;
 880      enum machine_mode mode;
 881 {
 882   return (register_operand (op, mode)
 883           || (GET_CODE (op) == CONST_INT && SMALL_INT (op))
 884           || (! TARGET_ARCH64
 885               && GET_CODE (op) == CONST_DOUBLE
 886               && (unsigned HOST_WIDE_INT) (CONST_DOUBLE_LOW (op) + 0x1000) < 0x2000
 887               && (unsigned HOST_WIDE_INT) (CONST_DOUBLE_HIGH (op) + 0x1000) < 0x2000)
 888           || (TARGET_ARCH64
 889               && GET_CODE (op) == CONST_DOUBLE
 890               && (unsigned HOST_WIDE_INT) (CONST_DOUBLE_LOW (op) + 0x1000) < 0x2000
 891               && ((CONST_DOUBLE_HIGH (op) == -1
 892                    && (CONST_DOUBLE_LOW (op) & 0x1000) == 0x1000)
 893                   || (CONST_DOUBLE_HIGH (op) == 0
 894                       && (CONST_DOUBLE_LOW (op) & 0x1000) == 0))));
 895 }
 896
 897 /* Return true if OP is a register, or is a CONST_INT or CONST_DOUBLE that
 898    can fit in an 11 bit immediate field.  This is an acceptable DImode
 899    operand for the movcc instructions.  */
 900 /* ??? Replace with arith11_operand?  */
 901
 902 int
 903 arith11_double_operand (op, mode)
 904      rtx op;
 905      enum machine_mode mode;
 906 {
 907   return (register_operand (op, mode)
 908           || (GET_CODE (op) == CONST_DOUBLE
 909               && (GET_MODE (op) == mode || GET_MODE (op) == VOIDmode)
 910               && (unsigned HOST_WIDE_INT) (CONST_DOUBLE_LOW (op) + 0x400) < 0x800
 911               && ((CONST_DOUBLE_HIGH (op) == -1
 912                    && (CONST_DOUBLE_LOW (op) & 0x400) == 0x400)
 913                   || (CONST_DOUBLE_HIGH (op) == 0
 914                       && (CONST_DOUBLE_LOW (op) & 0x400) == 0)))
 915           || (GET_CODE (op) == CONST_INT
 916               && (GET_MODE (op) == mode || GET_MODE (op) == VOIDmode)
 917               && (unsigned HOST_WIDE_INT) (INTVAL (op) + 0x400) < 0x800));
 918 }
 919
 920 /* Return true if OP is a register, or is a CONST_INT or CONST_DOUBLE that
 921    can fit in an 10 bit immediate field.  This is an acceptable DImode
 922    operand for the movrcc instructions.  */
 923 /* ??? Replace with arith10_operand?  */
 924
 925 int
 926 arith10_double_operand (op, mode)
 927      rtx op;
 928      enum machine_mode mode;
 929 {
 930   return (register_operand (op, mode)
 931           || (GET_CODE (op) == CONST_DOUBLE
 932               && (GET_MODE (op) == mode || GET_MODE (op) == VOIDmode)
 933               && (unsigned) (CONST_DOUBLE_LOW (op) + 0x200) < 0x400
 934               && ((CONST_DOUBLE_HIGH (op) == -1
 935                    && (CONST_DOUBLE_LOW (op) & 0x200) == 0x200)
 936                   || (CONST_DOUBLE_HIGH (op) == 0
 937                       && (CONST_DOUBLE_LOW (op) & 0x200) == 0)))
 938           || (GET_CODE (op) == CONST_INT
 939               && (GET_MODE (op) == mode || GET_MODE (op) == VOIDmode)
 940               && (unsigned HOST_WIDE_INT) (INTVAL (op) + 0x200) < 0x400));
 941 }
 942
 943 /* Return truth value of whether OP is a integer which fits the
 944    range constraining immediate operands in most three-address insns,
 945    which have a 13 bit immediate field.  */
 946
 947 int
 948 small_int (op, mode)
 949      rtx op;
 950      enum machine_mode mode;
 951 {
 952   return (GET_CODE (op) == CONST_INT && SMALL_INT (op));
 953 }
 954
 955 /* Recognize operand values for the umul instruction.  That instruction sign
 956    extends immediate values just like all other sparc instructions, but
 957    interprets the extended result as an unsigned number.  */
 958
 959 int
 960 uns_small_int (op, mode)
 961      rtx op;
 962      enum machine_mode mode;
 963 {
 964 #if HOST_BITS_PER_WIDE_INT > 32
 965   /* All allowed constants will fit a CONST_INT.  */
 966   return (GET_CODE (op) == CONST_INT
 967           && ((INTVAL (op) >= 0 && INTVAL (op) < 0x1000)
 968               || (INTVAL (op) >= 0xFFFFF000 && INTVAL (op) < 0x100000000L)));
 969 #else
 970   return ((GET_CODE (op) == CONST_INT && (unsigned) INTVAL (op) < 0x1000)
 971           || (GET_CODE (op) == CONST_DOUBLE
 972               && CONST_DOUBLE_HIGH (op) == 0
 973               && (unsigned) CONST_DOUBLE_LOW (op) - 0xFFFFF000 < 0x1000));
 974 #endif
 975 }
 976
 977 int
 978 uns_arith_operand (op, mode)
 979      rtx op;
 980      enum machine_mode mode;
 981 {
 982   return register_operand (op, mode) || uns_small_int (op, mode);
 983 }
 984
 985 /* Return truth value of statement that OP is a call-clobbered register.  */
 986 int
 987 clobbered_register (op, mode)
 988      rtx op;
 989      enum machine_mode mode;
 990 {
 991   return (GET_CODE (op) == REG && call_used_regs[REGNO (op)]);
 992 }
 993 \f
 994 /* X and Y are two things to compare using CODE.  Emit the compare insn and
 995    return the rtx for the cc reg in the proper mode.  */
 996
 997 rtx
 998 gen_compare_reg (code, x, y)
 999      enum rtx_code code;
1000      rtx x, y;
1001 {
1002   enum machine_mode mode = SELECT_CC_MODE (code, x, y);
1003   rtx cc_reg;
1004
1005   /* ??? We don't have movcc patterns so we cannot generate pseudo regs for the
1006      fcc regs (cse can't tell they're really call clobbered regs and will
1007      remove a duplicate comparison even if there is an intervening function
1008      call - it will then try to reload the cc reg via an int reg which is why
1009      we need the movcc patterns).  It is possible to provide the movcc
1010      patterns by using the ldxfsr/stxfsr v9 insns.  I tried it: you need two
1011      registers (say %g1,%g5) and it takes about 6 insns.  A better fix would be
1012      to tell cse that CCFPE mode registers (even pseudos) are call
1013      clobbered.  */
1014
1015   /* ??? This is an experiment.  Rather than making changes to cse which may
1016      or may not be easy/clean, we do our own cse.  This is possible because
1017      we will generate hard registers.  Cse knows they're call clobbered (it
1018      doesn't know the same thing about pseudos). If we guess wrong, no big
1019      deal, but if we win, great!  */
1020
1021   if (TARGET_V9 && GET_MODE_CLASS (GET_MODE (x)) == MODE_FLOAT)
1022 #if 1 /* experiment */
1023     {
1024       int reg;
1025       /* We cycle through the registers to ensure they're all exercised.  */
1026       static int next_fcc_reg = 0;
1027       /* Previous x,y for each fcc reg.  */
1028       static rtx prev_args[4][2];
1029
1030       /* Scan prev_args for x,y.  */
1031       for (reg = 0; reg < 4; reg++)
1032         if (prev_args[reg][0] == x && prev_args[reg][1] == y)
1033           break;
1034       if (reg == 4)
1035         {
1036           reg = next_fcc_reg;
1037           prev_args[reg][0] = x;
1038           prev_args[reg][1] = y;
1039           next_fcc_reg = (next_fcc_reg + 1) & 3;
1040         }
1041       cc_reg = gen_rtx (REG, mode, reg + SPARC_FIRST_V9_FCC_REG);
1042     }
1043 #else
1044     cc_reg = gen_reg_rtx (mode);
1045 #endif /* ! experiment */
1046   else if (GET_MODE_CLASS (GET_MODE (x)) == MODE_FLOAT)
1047     cc_reg = gen_rtx (REG, mode, SPARC_FCC_REG);
1048   else
1049     cc_reg = gen_rtx (REG, mode, SPARC_ICC_REG);
1050
1051   emit_insn (gen_rtx (SET, VOIDmode, cc_reg,
1052                       gen_rtx (COMPARE, mode, x, y)));
1053
1054   return cc_reg;
1055 }
1056
1057 /* This function is used for v9 only.
1058    CODE is the code for an Scc's comparison.
1059    OPERANDS[0] is the target of the Scc insn.
1060    OPERANDS[1] is the value we compare against const0_rtx (which hasn't
1061    been generated yet).
1062
1063    This function is needed to turn
1064
1065            (set (reg:SI 110)
1066                (gt (reg:CCX 100 %icc)
1067                    (const_int 0)))
1068    into
1069            (set (reg:SI 110)
1070                (gt:DI (reg:CCX 100 %icc)
1071                    (const_int 0)))
1072
1073    IE: The instruction recognizer needs to see the mode of the comparison to
1074    find the right instruction. We could use "gt:DI" right in the
1075    define_expand, but leaving it out allows us to handle DI, SI, etc.
1076
1077    We refer to the global sparc compare operands sparc_compare_op0 and
1078    sparc_compare_op1.  */
1079
1080 int
1081 gen_v9_scc (compare_code, operands)
1082      enum rtx_code compare_code;
1083      register rtx *operands;
1084 {
1085   rtx temp, op0, op1;
1086
1087   if (! TARGET_ARCH64
1088       && (GET_MODE (sparc_compare_op0) == DImode
1089           || GET_MODE (operands[0]) == DImode))
1090     return 0;
1091
1092   /* Handle the case where operands[0] == sparc_compare_op0.
1093      We "early clobber" the result.  */
1094   if (REGNO (operands[0]) == REGNO (sparc_compare_op0))
1095     {
1096       op0 = gen_reg_rtx (GET_MODE (sparc_compare_op0));
1097       emit_move_insn (op0, sparc_compare_op0);
1098     }
1099   else
1100     op0 = sparc_compare_op0;
1101   /* For consistency in the following.  */
1102   op1 = sparc_compare_op1;
1103
1104   /* Try to use the movrCC insns.  */
1105   if (TARGET_ARCH64
1106       && GET_MODE_CLASS (GET_MODE (op0)) == MODE_INT
1107       && op1 == const0_rtx
1108       && v9_regcmp_p (compare_code))
1109     {
1110       /* Special case for op0 != 0.  This can be done with one instruction if
1111          operands[0] == sparc_compare_op0.  We don't assume they are equal
1112          now though.  */
1113
1114       if (compare_code == NE
1115           && GET_MODE (operands[0]) == DImode
1116           && GET_MODE (op0) == DImode)
1117         {
1118           emit_insn (gen_rtx (SET, VOIDmode, operands[0], op0));
1119           emit_insn (gen_rtx (SET, VOIDmode, operands[0],
1120                               gen_rtx (IF_THEN_ELSE, DImode,
1121                                        gen_rtx (compare_code, DImode,
1122                                                 op0, const0_rtx),
1123                                        const1_rtx,
1124                                        operands[0])));
1125           return 1;
1126         }
1127
1128       emit_insn (gen_rtx (SET, VOIDmode, operands[0], const0_rtx));
1129       if (GET_MODE (op0) != DImode)
1130         {
1131           temp = gen_reg_rtx (DImode);
1132           convert_move (temp, op0, 0);
1133         }
1134       else
1135         temp = op0;
1136       emit_insn (gen_rtx (SET, VOIDmode, operands[0],
1137                           gen_rtx (IF_THEN_ELSE, GET_MODE (operands[0]),
1138                                    gen_rtx (compare_code, DImode,
1139                                             temp, const0_rtx),
1140                                    const1_rtx,
1141                                    operands[0])));
1142       return 1;
1143     }
1144   else
1145     {
1146       operands[1] = gen_compare_reg (compare_code, op0, op1);
1147
1148       switch (GET_MODE (operands[1]))
1149         {
1150           case CCmode :
1151           case CCXmode :
1152           case CCFPEmode :
1153           case CCFPmode :
1154             break;
1155           default :
1156             abort ();
1157         }
1158       emit_insn (gen_rtx (SET, VOIDmode, operands[0], const0_rtx));
1159       emit_insn (gen_rtx (SET, VOIDmode, operands[0],
1160                           gen_rtx (IF_THEN_ELSE, GET_MODE (operands[0]),
1161                                    gen_rtx (compare_code,
1162                                             GET_MODE (operands[1]),
1163                                             operands[1], const0_rtx),
1164                                     const1_rtx, operands[0])));
1165       return 1;
1166     }
1167 }
1168
1169 /* Emit a conditional jump insn for the v9 architecture using comparison code
1170    CODE and jump target LABEL.
1171    This function exists to take advantage of the v9 brxx insns.  */
1172
1173 void
1174 emit_v9_brxx_insn (code, op0, label)
1175      enum rtx_code code;
1176      rtx op0, label;
1177 {
1178   emit_jump_insn (gen_rtx (SET, VOIDmode,
1179                            pc_rtx,
1180                            gen_rtx (IF_THEN_ELSE, VOIDmode,
1181                                     gen_rtx (code, GET_MODE (op0),
1182                                              op0, const0_rtx),
1183                                     gen_rtx (LABEL_REF, VOIDmode, label),
1184                                     pc_rtx)));
1185 }
1186 \f
1187 /* Return nonzero if a return peephole merging return with
1188    setting of output register is ok.  */
1189 int
1190 leaf_return_peephole_ok ()
1191 {
1192   return (actual_fsize == 0);
1193 }
1194
1195 /* Return nonzero if TRIAL can go into the function epilogue's
1196    delay slot.  SLOT is the slot we are trying to fill.  */
1197
1198 int
1199 eligible_for_epilogue_delay (trial, slot)
1200      rtx trial;
1201      int slot;
1202 {
1203   rtx pat, src;
1204
1205   if (slot >= 1)
1206     return 0;
1207
1208   if (GET_CODE (trial) != INSN || GET_CODE (PATTERN (trial)) != SET)
1209     return 0;
1210
1211   if (get_attr_length (trial) != 1)
1212     return 0;
1213
1214   /* If %g0 is live, there are lots of things we can't handle.
1215      Rather than trying to find them all now, let's punt and only
1216      optimize things as necessary.  */
1217   if (TARGET_LIVE_G0)
1218     return 0;
1219
1220   /* In the case of a true leaf function, anything can go into the delay slot.
1221      A delay slot only exists however if the frame size is zero, otherwise
1222      we will put an insn to adjust the stack after the return.  */
1223   if (leaf_function)
1224     {
1225       if (leaf_return_peephole_ok ())
1226         return ((get_attr_in_uncond_branch_delay (trial)
1227                  == IN_BRANCH_DELAY_TRUE));
1228       return 0;
1229     }
1230
1231   /* If only trivial `restore' insns work, nothing can go in the
1232      delay slot.  */
1233   else if (TARGET_BROKEN_SAVERESTORE)
1234     return 0;
1235
1236   pat = PATTERN (trial);
1237
1238   /* Otherwise, only operations which can be done in tandem with
1239      a `restore' insn can go into the delay slot.  */
1240   if (GET_CODE (SET_DEST (pat)) != REG
1241       || REGNO (SET_DEST (pat)) >= 32
1242       || REGNO (SET_DEST (pat)) < 24)
1243     return 0;
1244
1245   /* The set of insns matched here must agree precisely with the set of
1246      patterns paired with a RETURN in sparc.md.  */
1247
1248   src = SET_SRC (pat);
1249
1250   /* This matches "*return_[qhs]".  */
1251   if (arith_operand (src, GET_MODE (src)))
1252     return GET_MODE_SIZE (GET_MODE (src)) <= GET_MODE_SIZE (SImode);
1253
1254   /* This matches "*return_di".  */
1255   else if (arith_double_operand (src, GET_MODE (src)))
1256     return GET_MODE_SIZE (GET_MODE (src)) <= GET_MODE_SIZE (DImode);
1257
1258   /* This matches "*return_sf_no_fpu".  */
1259   else if (! TARGET_FPU && restore_operand (SET_DEST (pat), SFmode)
1260            && register_operand (src, SFmode))
1261     return 1;
1262
1263   /* This matches "*return_addsi".  */
1264   else if (GET_CODE (src) == PLUS
1265            && arith_operand (XEXP (src, 0), SImode)
1266            && arith_operand (XEXP (src, 1), SImode)
1267            && (register_operand (XEXP (src, 0), SImode)
1268                || register_operand (XEXP (src, 1), SImode)))
1269     return 1;
1270
1271   /* This matches "*return_adddi".  */
1272   else if (GET_CODE (src) == PLUS
1273            && arith_double_operand (XEXP (src, 0), DImode)
1274            && arith_double_operand (XEXP (src, 1), DImode)
1275            && (register_operand (XEXP (src, 0), DImode)
1276                || register_operand (XEXP (src, 1), DImode)))
1277     return 1;
1278
1279   /* This matches "*return_subsi".  */
1280   else if (GET_CODE (src) == MINUS
1281       && register_operand (XEXP (src, 0), SImode)
1282       && small_int (XEXP (src, 1), VOIDmode)
1283       && INTVAL (XEXP (src, 1)) != -4096)
1284     return 1;
1285
1286   return 0;
1287 }
1288
1289 int
1290 short_branch (uid1, uid2)
1291      int uid1, uid2;
1292 {
1293   unsigned int delta = insn_addresses[uid1] - insn_addresses[uid2];
1294   if (delta + 1024 < 2048)
1295     return 1;
1296   /* warning ("long branch, distance %d", delta); */
1297   return 0;
1298 }
1299
1300 /* Return non-zero if REG is not used after INSN.
1301    We assume REG is a reload reg, and therefore does
1302    not live past labels or calls or jumps.  */
1303 int
1304 reg_unused_after (reg, insn)
1305      rtx reg;
1306      rtx insn;
1307 {
1308   enum rtx_code code, prev_code = UNKNOWN;
1309
1310   while (insn = NEXT_INSN (insn))
1311     {
1312       if (prev_code == CALL_INSN && call_used_regs[REGNO (reg)])
1313         return 1;
1314
1315       code = GET_CODE (insn);
1316       if (GET_CODE (insn) == CODE_LABEL)
1317         return 1;
1318
1319       if (GET_RTX_CLASS (code) == 'i')
1320         {
1321           rtx set = single_set (insn);
1322           int in_src = set && reg_overlap_mentioned_p (reg, SET_SRC (set));
1323           if (set && in_src)
1324             return 0;
1325           if (set && reg_overlap_mentioned_p (reg, SET_DEST (set)))
1326             return 1;
1327           if (set == 0 && reg_overlap_mentioned_p (reg, PATTERN (insn)))
1328             return 0;
1329         }
1330       prev_code = code;
1331     }
1332   return 1;
1333 }
1334 \f
1335 /* The table we use to reference PIC data.  */
1336 static rtx global_offset_table;
1337
1338 /* Ensure that we are not using patterns that are not OK with PIC.  */
1339
1340 int
1341 check_pic (i)
1342      int i;
1343 {
1344   switch (flag_pic)
1345     {
1346     case 1:
1347       if (GET_CODE (recog_operand[i]) == SYMBOL_REF
1348           || (GET_CODE (recog_operand[i]) == CONST
1349               && ! (GET_CODE (XEXP (recog_operand[i], 0)) == MINUS
1350                     && (XEXP (XEXP (recog_operand[i], 0), 0)
1351                         == global_offset_table)
1352                     && (GET_CODE (XEXP (XEXP (recog_operand[i], 0), 1))
1353                         == CONST))))
1354         abort ();
1355     case 2:
1356     default:
1357       return 1;
1358     }
1359 }
1360
1361 /* Return true if X is an address which needs a temporary register when
1362    reloaded while generating PIC code.  */
1363
1364 int
1365 pic_address_needs_scratch (x)
1366      rtx x;
1367 {
1368   /* An address which is a symbolic plus a non SMALL_INT needs a temp reg.  */
1369   if (GET_CODE (x) == CONST && GET_CODE (XEXP (x, 0)) == PLUS
1370       && GET_CODE (XEXP (XEXP (x, 0), 0)) == SYMBOL_REF
1371       && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT
1372       && ! SMALL_INT (XEXP (XEXP (x, 0), 1)))
1373     return 1;
1374
1375   return 0;
1376 }
1377
1378 /* Legitimize PIC addresses.  If the address is already position-independent,
1379    we return ORIG.  Newly generated position-independent addresses go into a
1380    reg.  This is REG if non zero, otherwise we allocate register(s) as
1381    necessary.  */
1382
1383 rtx
1384 legitimize_pic_address (orig, mode, reg)
1385      rtx orig;
1386      enum machine_mode mode;
1387      rtx reg;
1388 {
1389   if (GET_CODE (orig) == SYMBOL_REF)
1390     {
1391       rtx pic_ref, address;
1392       rtx insn;
1393
1394       if (reg == 0)
1395         {
1396           if (reload_in_progress || reload_completed)
1397             abort ();
1398           else
1399             reg = gen_reg_rtx (Pmode);
1400         }
1401
1402       if (flag_pic == 2)
1403         {
1404           /* If not during reload, allocate another temp reg here for loading
1405              in the address, so that these instructions can be optimized
1406              properly.  */
1407           rtx temp_reg = ((reload_in_progress || reload_completed)
1408                           ? reg : gen_reg_rtx (Pmode));
1409
1410           /* Must put the SYMBOL_REF inside an UNSPEC here so that cse
1411              won't get confused into thinking that these two instructions
1412              are loading in the true address of the symbol.  If in the
1413              future a PIC rtx exists, that should be used instead.  */
1414           emit_insn (gen_pic_sethi_si (temp_reg, orig));
1415           emit_insn (gen_pic_lo_sum_si (temp_reg, temp_reg, orig));
1416
1417           address = temp_reg;
1418         }
1419       else
1420         address = orig;
1421
1422       pic_ref = gen_rtx (MEM, Pmode,
1423                          gen_rtx (PLUS, Pmode,
1424                                   pic_offset_table_rtx, address));
1425       current_function_uses_pic_offset_table = 1;
1426       RTX_UNCHANGING_P (pic_ref) = 1;
1427       insn = emit_move_insn (reg, pic_ref);
1428       /* Put a REG_EQUAL note on this insn, so that it can be optimized
1429          by loop.  */
1430       REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_EQUAL, orig,
1431                                   REG_NOTES (insn));
1432       return reg;
1433     }
1434   else if (GET_CODE (orig) == CONST)
1435     {
1436       rtx base, offset;
1437
1438       if (GET_CODE (XEXP (orig, 0)) == PLUS
1439           && XEXP (XEXP (orig, 0), 0) == pic_offset_table_rtx)
1440         return orig;
1441
1442       if (reg == 0)
1443         {
1444           if (reload_in_progress || reload_completed)
1445             abort ();
1446           else
1447             reg = gen_reg_rtx (Pmode);
1448         }
1449
1450       if (GET_CODE (XEXP (orig, 0)) == PLUS)
1451         {
1452           base = legitimize_pic_address (XEXP (XEXP (orig, 0), 0), Pmode, reg);
1453           offset = legitimize_pic_address (XEXP (XEXP (orig, 0), 1), Pmode,
1454                                          base == reg ? 0 : reg);
1455         }
1456       else
1457         abort ();
1458
1459       if (GET_CODE (offset) == CONST_INT)
1460         {
1461           if (SMALL_INT (offset))
1462             return plus_constant_for_output (base, INTVAL (offset));
1463           else if (! reload_in_progress && ! reload_completed)
1464             offset = force_reg (Pmode, offset);
1465           else
1466             /* If we reach here, then something is seriously wrong.  */
1467             abort ();
1468         }
1469       return gen_rtx (PLUS, Pmode, base, offset);
1470     }
1471   else if (GET_CODE (orig) == LABEL_REF)
1472     /* ??? Why do we do this?  */
1473     current_function_uses_pic_offset_table = 1;
1474
1475   return orig;
1476 }
1477
1478 /* Set up PIC-specific rtl.  This should not cause any insns
1479    to be emitted.  */
1480
1481 void
1482 initialize_pic ()
1483 {
1484 }
1485
1486 /* Return the RTX for insns to set the PIC register.  */
1487
1488 static rtx
1489 pic_setup_code ()
1490 {
1491   rtx pic_pc_rtx;
1492   rtx l1, l2;
1493   rtx seq;
1494
1495   start_sequence ();
1496
1497   /* If -O0, show the PIC register remains live before this.  */
1498   if (obey_regdecls)
1499     emit_insn (gen_rtx (USE, VOIDmode, pic_offset_table_rtx));
1500
1501   l1 = gen_label_rtx ();
1502
1503   pic_pc_rtx = gen_rtx (CONST, Pmode,
1504                         gen_rtx (MINUS, Pmode,
1505                                  global_offset_table,
1506                                  gen_rtx (CONST, Pmode,
1507                                           gen_rtx (MINUS, Pmode,
1508                                                    gen_rtx (LABEL_REF,
1509                                                             VOIDmode, l1),
1510                                                    pc_rtx))));
1511
1512   /* sparc64: the RDPC instruction doesn't pair, and puts 4 bubbles in the
1513      pipe to boot.  So don't use it here, especially when we're
1514      doing a save anyway because of %l7.  */
1515
1516   l2 = gen_label_rtx ();
1517   emit_label (l1);
1518
1519   /* Iff we are doing delay branch optimization, slot the sethi up
1520      here so that it will fill the delay slot of the call.  */
1521   if (flag_delayed_branch)
1522     emit_insn (gen_rtx (SET, VOIDmode, pic_offset_table_rtx,
1523                         gen_rtx (HIGH, Pmode, pic_pc_rtx)));
1524
1525   /* Note that we pun calls and jumps here!  */
1526   emit_jump_insn (gen_get_pc_via_call (l2, l1));
1527
1528   emit_label (l2);
1529
1530   if (!flag_delayed_branch)
1531     emit_insn (gen_rtx (SET, VOIDmode, pic_offset_table_rtx,
1532                         gen_rtx (HIGH, Pmode, pic_pc_rtx)));
1533
1534   emit_insn (gen_rtx (SET, VOIDmode,
1535                       pic_offset_table_rtx,
1536                       gen_rtx (LO_SUM, Pmode,
1537                                pic_offset_table_rtx, pic_pc_rtx)));
1538   emit_insn (gen_rtx (SET, VOIDmode,
1539                       pic_offset_table_rtx,
1540                       gen_rtx (PLUS, Pmode,
1541                                pic_offset_table_rtx,
1542                                gen_rtx (REG, Pmode, 15))));
1543
1544   /* emit_insn (gen_rtx (ASM_INPUT, VOIDmode, "!#PROLOGUE# 1")); */
1545   LABEL_PRESERVE_P (l1) = 1;
1546   LABEL_PRESERVE_P (l2) = 1;
1547
1548   seq = gen_sequence ();
1549   end_sequence ();
1550
1551   return seq;
1552 }
1553
1554 /* Emit special PIC prologues and epilogues.  */
1555
1556 void
1557 finalize_pic ()
1558 {
1559   /* Labels to get the PC in the prologue of this function.  */
1560   int orig_flag_pic = flag_pic;
1561   rtx insn;
1562
1563   if (current_function_uses_pic_offset_table == 0)
1564     return;
1565
1566   if (! flag_pic)
1567     abort ();
1568
1569   /* Initialize every time through, since we can't easily
1570      know this to be permanent.  */
1571   global_offset_table = gen_rtx (SYMBOL_REF, Pmode, "_GLOBAL_OFFSET_TABLE_");
1572   flag_pic = 0;
1573
1574   emit_insn_after (pic_setup_code (), get_insns ());
1575
1576   /* Insert the code in each nonlocal goto receiver.  */
1577   for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
1578     if (GET_CODE (insn) == INSN && GET_CODE (PATTERN (insn)) == UNSPEC_VOLATILE
1579         && XINT (PATTERN (insn), 1) == 4)
1580       emit_insn_after (pic_setup_code (), insn);
1581
1582   flag_pic = orig_flag_pic;
1583
1584   /* Need to emit this whether or not we obey regdecls,
1585      since setjmp/longjmp can cause life info to screw up.
1586      ??? In the case where we don't obey regdecls, this is not sufficient
1587      since we may not fall out the bottom.  */
1588   emit_insn (gen_rtx (USE, VOIDmode, pic_offset_table_rtx));
1589 }
1590 \f
1591 /* Emit insns to move operands[1] into operands[0].
1592
1593    Return 1 if we have written out everything that needs to be done to
1594    do the move.  Otherwise, return 0 and the caller will emit the move
1595    normally.  */
1596
1597 int
1598 emit_move_sequence (operands, mode)
1599      rtx *operands;
1600      enum machine_mode mode;
1601 {
1602   register rtx operand0 = operands[0];
1603   register rtx operand1 = operands[1];
1604
1605   if (CONSTANT_P (operand1) && flag_pic
1606       && pic_address_needs_scratch (operand1))
1607     operands[1] = operand1 = legitimize_pic_address (operand1, mode, 0);
1608
1609   /* Handle most common case first: storing into a register.  */
1610   if (register_operand (operand0, mode))
1611     {
1612       if (register_operand (operand1, mode)
1613           || (GET_CODE (operand1) == CONST_INT && SMALL_INT (operand1))
1614           || (GET_CODE (operand1) == CONST_DOUBLE
1615               && arith_double_operand (operand1, DImode))
1616           || (GET_CODE (operand1) == HIGH && GET_MODE (operand1) != DImode)
1617           /* Only `general_operands' can come here, so MEM is ok.  */
1618           || GET_CODE (operand1) == MEM)
1619         {
1620           /* Run this case quickly.  */
1621           emit_insn (gen_rtx (SET, VOIDmode, operand0, operand1));
1622           return 1;
1623         }
1624     }
1625   else if (GET_CODE (operand0) == MEM)
1626     {
1627       if (register_operand (operand1, mode)
1628           || (operand1 == const0_rtx && ! TARGET_LIVE_G0))
1629         {
1630           /* Run this case quickly.  */
1631           emit_insn (gen_rtx (SET, VOIDmode, operand0, operand1));
1632           return 1;
1633         }
1634       if (! reload_in_progress)
1635         {
1636           operands[0] = validize_mem (operand0);
1637           operands[1] = operand1 = force_reg (mode, operand1);
1638         }
1639     }
1640
1641   if (GET_CODE (operand1) == LABEL_REF
1642       && mode == SImode && flag_pic)
1643     {
1644       if (TARGET_ARCH64)
1645         abort ();
1646       emit_insn (gen_move_pic_label_si (operand0, operand1));
1647       return 1;
1648     }
1649   /* Non-pic LABEL_REF's in sparc64 are expensive to do the normal way,
1650      so always use special code.  */
1651   else if (GET_CODE (operand1) == LABEL_REF
1652            && mode == DImode)
1653     {
1654       if (! TARGET_ARCH64)
1655         abort ();
1656       emit_insn (gen_move_label_di (operand0, operand1));
1657       return 1;
1658     }
1659   /* DImode HIGH values in sparc64 need a clobber added.  */
1660   else if (TARGET_ARCH64
1661       && GET_CODE (operand1) == HIGH && GET_MODE (operand1) == DImode)
1662     {
1663       emit_insn (gen_sethi_di_sp64 (operand0, XEXP (operand1, 0)));
1664       return 1;
1665     }
1666   /* Simplify the source if we need to.  */
1667   else if (GET_CODE (operand1) != HIGH && immediate_operand (operand1, mode))
1668     {
1669       if (flag_pic && symbolic_operand (operand1, mode))
1670         {
1671           rtx temp_reg = reload_in_progress ? operand0 : 0;
1672
1673           operands[1] = legitimize_pic_address (operand1, mode, temp_reg);
1674         }
1675       else if (GET_CODE (operand1) == CONST_INT
1676                ? (! SMALL_INT (operand1)
1677                   && ! SPARC_SETHI_P (INTVAL (operand1)))
1678                : GET_CODE (operand1) == CONST_DOUBLE
1679                ? ! arith_double_operand (operand1, DImode)
1680                : 1)
1681         {
1682           /* For DImode values, temp must be operand0 because of the way
1683              HI and LO_SUM work.  The LO_SUM operator only copies half of
1684              the LSW from the dest of the HI operator.  If the LO_SUM dest is
1685              not the same as the HI dest, then the MSW of the LO_SUM dest will
1686              never be set.
1687
1688              ??? The real problem here is that the ...(HI:DImode pattern emits
1689              multiple instructions, and the ...(LO_SUM:DImode pattern emits
1690              one instruction.  This fails, because the compiler assumes that
1691              LO_SUM copies all bits of the first operand to its dest.  Better
1692              would be to have the HI pattern emit one instruction and the
1693              LO_SUM pattern multiple instructions.  Even better would be
1694              to use four rtl insns.  */
1695           rtx temp = ((reload_in_progress || mode == DImode)
1696                       ? operand0 : gen_reg_rtx (mode));
1697
1698           if (TARGET_ARCH64 && mode == DImode)
1699             emit_insn (gen_sethi_di_sp64 (temp, operand1));
1700           else
1701             emit_insn (gen_rtx (SET, VOIDmode, temp,
1702                                 gen_rtx (HIGH, mode, operand1)));
1703
1704           if (GET_CODE (operand1) == CONST_INT)
1705             operand1 = GEN_INT (INTVAL (operand1) & 0xffffffff);
1706           else if (GET_CODE (operand1) == CONST_DOUBLE)
1707             operand1 = GEN_INT (CONST_DOUBLE_LOW (operand1) & 0xffffffff);
1708           operands[1] = gen_rtx (LO_SUM, mode, temp, operand1);
1709         }
1710     }
1711
1712   /* Now have insn-emit do whatever it normally does.  */
1713   return 0;
1714 }
1715 \f
1716 /* Return the best assembler insn template
1717    for moving operands[1] into operands[0] as a 4 byte quantity.
1718
1719    This isn't intended to be very smart.  It is up to the caller to
1720    choose the best way to do things.
1721
1722    Note that OPERANDS may be modified to suit the returned string.  */
1723
1724 char *
1725 singlemove_string (operands)
1726      rtx *operands;
1727 {
1728   if (GET_CODE (operands[0]) == MEM)
1729     {
1730       if (GET_CODE (operands[1]) != MEM)
1731         return "st %r1,%0";
1732       else
1733         abort ();
1734     }
1735   else if (GET_CODE (operands[1]) == MEM)
1736     return "ld %1,%0";
1737   else if (GET_CODE (operands[1]) == CONST_DOUBLE)
1738     {
1739       REAL_VALUE_TYPE r;
1740       long i;
1741
1742       /* Must be SFmode, otherwise this doesn't make sense.  */
1743       if (GET_MODE (operands[1]) != SFmode)
1744         abort ();
1745
1746       REAL_VALUE_FROM_CONST_DOUBLE (r, operands[1]);
1747       REAL_VALUE_TO_TARGET_SINGLE (r, i);
1748       operands[1] = GEN_INT (i);
1749
1750       if (CONST_OK_FOR_LETTER_P (i, 'I'))
1751         return "mov %1,%0";
1752       else if ((i & 0x000003FF) != 0)
1753         return "sethi %%hi(%a1),%0\n\tor %0,%%lo(%a1),%0";
1754       else
1755         return "sethi %%hi(%a1),%0";
1756     }
1757   else if (GET_CODE (operands[1]) == CONST_INT
1758            && ! CONST_OK_FOR_LETTER_P (INTVAL (operands[1]), 'I'))
1759     {
1760       HOST_WIDE_INT i = INTVAL (operands[1]);
1761
1762       /* If all low order 10 bits are clear, then we only need a single
1763          sethi insn to load the constant.  */
1764       /* FIXME: Use SETHI_P.  */
1765       if ((i & 0x000003FF) != 0)
1766         return "sethi %%hi(%a1),%0\n\tor %0,%%lo(%a1),%0";
1767       else
1768         return "sethi %%hi(%a1),%0";
1769     }
1770   /* Operand 1 must be a register, or a 'I' type CONST_INT.  */
1771   return "mov %1,%0";
1772 }
1773
1774 /* Return the best assembler insn template
1775    for moving operands[1] into operands[0] as an 8 byte quantity.
1776
1777    This isn't intended to be very smart.  It is up to the caller to
1778    choose the best way to do things.
1779
1780    Note that OPERANDS may be modified to suit the returned string.  */
1781
1782 char *
1783 doublemove_string (operands)
1784      rtx *operands;
1785 {
1786   rtx op0 = operands[0], op1 = operands[1];
1787
1788   if (GET_CODE (op0) == MEM)
1789     {
1790       if (GET_CODE (op1) == REG)
1791         {
1792           if (FP_REG_P (op1))
1793             return "std %1,%0";
1794           return TARGET_ARCH64 ? "stx %1,%0" : "std %1,%0";
1795         }
1796       if (TARGET_ARCH64
1797           && (op1 == const0_rtx
1798               || (GET_MODE (op1) != VOIDmode
1799                   && op1 == CONST0_RTX (GET_MODE (op1)))))
1800         return "stx %r1,%0";
1801       abort ();
1802     }
1803   else if (GET_CODE (op1) == MEM)
1804     {
1805       if (GET_CODE (op0) != REG)
1806         abort ();
1807       if (FP_REG_P (op0))
1808         return "ldd %1,%0";
1809       return TARGET_ARCH64 ? "ldx %1,%0" : "ldd %1,%0";
1810     }
1811   else if (GET_CODE (operands[1]) == CONST_DOUBLE)
1812     {
1813       /* ??? Unfinished, and maybe not needed.  */
1814       abort ();
1815     }
1816   else if (GET_CODE (operands[1]) == CONST_INT
1817            && ! CONST_OK_FOR_LETTER_P (INTVAL (operands[1]), 'I'))
1818     {
1819       /* ??? Unfinished, and maybe not needed.  */
1820       abort ();
1821     }
1822   /* Operand 1 must be a register, or a 'I' type CONST_INT.  */
1823   return "mov %1,%0";
1824 }
1825
1826 /* Return non-zero if it is OK to assume that the given memory operand is
1827    aligned at least to a 8-byte boundary.  This should only be called
1828    for memory accesses whose size is 8 bytes or larger.  */
1829
1830 int
1831 mem_aligned_8 (mem)
1832      register rtx mem;
1833 {
1834   register rtx addr;
1835   register rtx base;
1836   register rtx offset;
1837
1838   if (GET_CODE (mem) != MEM)
1839     return 0;   /* It's gotta be a MEM! */
1840
1841   addr = XEXP (mem, 0);
1842
1843   /* Now that all misaligned double parms are copied on function entry,
1844      we can assume any 64-bit object is 64-bit aligned except those which
1845      are at unaligned offsets from the stack or frame pointer.  If the
1846      TARGET_UNALIGNED_DOUBLES switch is given, we do not make this
1847      assumption.  */
1848
1849   /* See what register we use in the address.  */
1850   base = 0;
1851   if (GET_CODE (addr) == PLUS)
1852     {
1853       if (GET_CODE (XEXP (addr, 0)) == REG
1854           && GET_CODE (XEXP (addr, 1)) == CONST_INT)
1855         {
1856           base = XEXP (addr, 0);
1857           offset = XEXP (addr, 1);
1858         }
1859     }
1860   else if (GET_CODE (addr) == REG)
1861     {
1862       base = addr;
1863       offset = const0_rtx;
1864     }
1865
1866   /* If it's the stack or frame pointer, check offset alignment.
1867      We can have improper alignment in the function entry code.  */
1868   if (base
1869       && (REGNO (base) == FRAME_POINTER_REGNUM
1870           || REGNO (base) == STACK_POINTER_REGNUM))
1871     {
1872       if (((INTVAL (offset) - SPARC_STACK_BIAS) & 0x7) == 0)
1873         return 1;
1874     }
1875   /* Anything else we know is properly aligned unless TARGET_UNALIGNED_DOUBLES
1876      is true, in which case we can only assume that an access is aligned if
1877      it is to a constant address, or the address involves a LO_SUM.
1878
1879      We used to assume an address was aligned if MEM_IN_STRUCT_P was true.
1880      That assumption was deleted so that gcc generated code can be used with
1881      memory allocators that only guarantee 4 byte alignment.  */
1882   else if (! TARGET_UNALIGNED_DOUBLES || CONSTANT_P (addr)
1883            || GET_CODE (addr) == LO_SUM)
1884     return 1;
1885
1886   /* An obviously unaligned address.  */
1887   return 0;
1888 }
1889
1890 enum optype { REGOP, OFFSOP, MEMOP, PUSHOP, POPOP, CNSTOP, RNDOP };
1891
1892 /* Output assembler code to perform a doubleword move insn
1893    with operands OPERANDS.  This is very similar to the following
1894    output_move_quad function.  */
1895
1896 char *
1897 output_move_double (operands)
1898      rtx *operands;
1899 {
1900   register rtx op0 = operands[0];
1901   register rtx op1 = operands[1];
1902   register enum optype optype0;
1903   register enum optype optype1;
1904   rtx latehalf[2];
1905   rtx addreg0 = 0;
1906   rtx addreg1 = 0;
1907   int highest_first = 0;
1908   int no_addreg1_decrement = 0;
1909
1910   /* First classify both operands.  */
1911
1912   if (REG_P (op0))
1913     optype0 = REGOP;
1914   else if (offsettable_memref_p (op0))
1915     optype0 = OFFSOP;
1916   else if (GET_CODE (op0) == MEM)
1917     optype0 = MEMOP;
1918   else
1919     optype0 = RNDOP;
1920
1921   if (REG_P (op1))
1922     optype1 = REGOP;
1923   else if (CONSTANT_P (op1))
1924     optype1 = CNSTOP;
1925   else if (offsettable_memref_p (op1))
1926     optype1 = OFFSOP;
1927   else if (GET_CODE (op1) == MEM)
1928     optype1 = MEMOP;
1929   else
1930     optype1 = RNDOP;
1931
1932   /* Check for the cases that the operand constraints are not
1933      supposed to allow to happen.  Abort if we get one,
1934      because generating code for these cases is painful.  */
1935
1936   if (optype0 == RNDOP || optype1 == RNDOP
1937       || (optype0 == MEM && optype1 == MEM))
1938     abort ();
1939
1940   /* If an operand is an unoffsettable memory ref, find a register
1941      we can increment temporarily to make it refer to the second word.  */
1942
1943   if (optype0 == MEMOP)
1944     addreg0 = find_addr_reg (XEXP (op0, 0));
1945
1946   if (optype1 == MEMOP)
1947     addreg1 = find_addr_reg (XEXP (op1, 0));
1948
1949   /* Ok, we can do one word at a time.
1950      Set up in LATEHALF the operands to use for the
1951      high-numbered (least significant) word and in some cases alter the
1952      operands in OPERANDS to be suitable for the low-numbered word.  */
1953
1954   if (optype0 == REGOP)
1955     latehalf[0] = gen_rtx (REG, SImode, REGNO (op0) + 1);
1956   else if (optype0 == OFFSOP)
1957     latehalf[0] = adj_offsettable_operand (op0, 4);
1958   else
1959     latehalf[0] = op0;
1960
1961   if (optype1 == REGOP)
1962     latehalf[1] = gen_rtx (REG, SImode, REGNO (op1) + 1);
1963   else if (optype1 == OFFSOP)
1964     latehalf[1] = adj_offsettable_operand (op1, 4);
1965   else if (optype1 == CNSTOP)
1966     {
1967       if (TARGET_ARCH64)
1968         {
1969           if (arith_double_operand (op1, DImode))
1970             {
1971               operands[1] = gen_rtx (CONST_INT, VOIDmode,
1972                                      CONST_DOUBLE_LOW (op1));
1973               return "mov %1,%0";
1974             }
1975           else
1976             {
1977               /* The only way to handle CONST_DOUBLEs or other 64 bit
1978                  constants here is to use a temporary, such as is done
1979                  for the V9 DImode sethi insn pattern.  This is not
1980                  a practical solution, so abort if we reach here.
1981                  The md file should always force such constants to
1982                  memory.  */
1983               abort ();
1984             }
1985         }
1986       else
1987         split_double (op1, &operands[1], &latehalf[1]);
1988     }
1989   else
1990     latehalf[1] = op1;
1991
1992   /* Easy case: try moving both words at once.  Check for moving between
1993      an even/odd register pair and a memory location.  */
1994   if ((optype0 == REGOP && optype1 != REGOP && optype1 != CNSTOP
1995        && (TARGET_ARCH64 || (REGNO (op0) & 1) == 0))
1996       || (optype0 != REGOP && optype0 != CNSTOP && optype1 == REGOP
1997           && (TARGET_ARCH64 || (REGNO (op1) & 1) == 0)))
1998     {
1999       register rtx mem,reg;
2000
2001       if (optype0 == REGOP)
2002         mem = op1, reg = op0;
2003       else
2004         mem = op0, reg = op1;
2005
2006       /* In v9, ldd can be used for word aligned addresses, so technically
2007          some of this logic is unneeded.  We still avoid ldd if the address
2008          is obviously unaligned though.  */
2009
2010       if (mem_aligned_8 (mem)
2011           /* If this is a floating point register higher than %f31,
2012              then we *must* use an aligned load, since `ld' will not accept
2013              the register number.  */
2014           || (TARGET_V9 && REGNO (reg) >= 64))
2015         {
2016           if (FP_REG_P (reg) || ! TARGET_ARCH64)
2017             return (mem == op1 ? "ldd %1,%0" : "std %1,%0");
2018           else
2019             return (mem == op1 ? "ldx %1,%0" : "stx %1,%0");
2020         }
2021     }
2022
2023   if (TARGET_ARCH64)
2024     {
2025       if (optype0 == REGOP && optype1 == REGOP)
2026         {
2027           if (FP_REG_P (op0))
2028             return "fmovd %1,%0";
2029           else
2030             return "mov %1,%0";
2031         }
2032     }
2033
2034   /* If the first move would clobber the source of the second one,
2035      do them in the other order.  */
2036
2037   /* Overlapping registers.  */
2038   if (optype0 == REGOP && optype1 == REGOP
2039       && REGNO (op0) == REGNO (latehalf[1]))
2040     {
2041       /* Do that word.  */
2042       output_asm_insn (singlemove_string (latehalf), latehalf);
2043       /* Do low-numbered word.  */
2044       return singlemove_string (operands);
2045     }
2046   /* Loading into a register which overlaps a register used in the address.  */
2047   else if (optype0 == REGOP && optype1 != REGOP
2048            && reg_overlap_mentioned_p (op0, op1))
2049     {
2050       /* If both halves of dest are used in the src memory address,
2051          add the two regs and put them in the low reg (op0).
2052          Then it works to load latehalf first.  */
2053       if (reg_mentioned_p (op0, XEXP (op1, 0))
2054           && reg_mentioned_p (latehalf[0], XEXP (op1, 0)))
2055         {
2056           rtx xops[2];
2057           xops[0] = latehalf[0];
2058           xops[1] = op0;
2059           output_asm_insn ("add %1,%0,%1", xops);
2060           operands[1] = gen_rtx (MEM, DImode, op0);
2061           latehalf[1] = adj_offsettable_operand (operands[1], 4);
2062           addreg1 = 0;
2063           highest_first = 1;
2064         }
2065       /* Only one register in the dest is used in the src memory address,
2066          and this is the first register of the dest, so we want to do
2067          the late half first here also.  */
2068       else if (! reg_mentioned_p (latehalf[0], XEXP (op1, 0)))
2069         highest_first = 1;
2070       /* Only one register in the dest is used in the src memory address,
2071          and this is the second register of the dest, so we want to do
2072          the late half last.  If addreg1 is set, and addreg1 is the same
2073          register as latehalf, then we must suppress the trailing decrement,
2074          because it would clobber the value just loaded.  */
2075       else if (addreg1 && reg_mentioned_p (addreg1, latehalf[0]))
2076         no_addreg1_decrement = 1;
2077     }
2078
2079   /* Normal case: do the two words, low-numbered first.
2080      Overlap case (highest_first set): do high-numbered word first.  */
2081
2082   if (! highest_first)
2083     output_asm_insn (singlemove_string (operands), operands);
2084
2085   /* Make any unoffsettable addresses point at high-numbered word.  */
2086   if (addreg0)
2087     output_asm_insn ("add %0,0x4,%0", &addreg0);
2088   if (addreg1)
2089     output_asm_insn ("add %0,0x4,%0", &addreg1);
2090
2091   /* Do that word.  */
2092   output_asm_insn (singlemove_string (latehalf), latehalf);
2093
2094   /* Undo the adds we just did.  */
2095   if (addreg0)
2096     output_asm_insn ("add %0,-0x4,%0", &addreg0);
2097   if (addreg1 && ! no_addreg1_decrement)
2098     output_asm_insn ("add %0,-0x4,%0", &addreg1);
2099
2100   if (highest_first)
2101     output_asm_insn (singlemove_string (operands), operands);
2102
2103   return "";
2104 }
2105
2106 /* Output assembler code to perform a quadword move insn
2107    with operands OPERANDS.  This is very similar to the preceding
2108    output_move_double function.  */
2109
2110 char *
2111 output_move_quad (operands)
2112      rtx *operands;
2113 {
2114   register rtx op0 = operands[0];
2115   register rtx op1 = operands[1];
2116   register enum optype optype0;
2117   register enum optype optype1;
2118   rtx wordpart[4][2];
2119   rtx addreg0 = 0;
2120   rtx addreg1 = 0;
2121
2122   /* First classify both operands.  */
2123
2124   if (REG_P (op0))
2125     optype0 = REGOP;
2126   else if (offsettable_memref_p (op0))
2127     optype0 = OFFSOP;
2128   else if (GET_CODE (op0) == MEM)
2129     optype0 = MEMOP;
2130   else
2131     optype0 = RNDOP;
2132
2133   if (REG_P (op1))
2134     optype1 = REGOP;
2135   else if (CONSTANT_P (op1))
2136     optype1 = CNSTOP;
2137   else if (offsettable_memref_p (op1))
2138     optype1 = OFFSOP;
2139   else if (GET_CODE (op1) == MEM)
2140     optype1 = MEMOP;
2141   else
2142     optype1 = RNDOP;
2143
2144   /* Check for the cases that the operand constraints are not
2145      supposed to allow to happen.  Abort if we get one,
2146      because generating code for these cases is painful.  */
2147
2148   if (optype0 == RNDOP || optype1 == RNDOP
2149       || (optype0 == MEM && optype1 == MEM))
2150     abort ();
2151
2152   /* If an operand is an unoffsettable memory ref, find a register
2153      we can increment temporarily to make it refer to the later words.  */
2154
2155   if (optype0 == MEMOP)
2156     addreg0 = find_addr_reg (XEXP (op0, 0));
2157
2158   if (optype1 == MEMOP)
2159     addreg1 = find_addr_reg (XEXP (op1, 0));
2160
2161   /* Ok, we can do one word at a time.
2162      Set up in wordpart the operands to use for each word of the arguments.  */
2163
2164   if (optype0 == REGOP)
2165     {
2166       wordpart[0][0] = gen_rtx (REG, word_mode, REGNO (op0) + 0);
2167       wordpart[1][0] = gen_rtx (REG, word_mode, REGNO (op0) + 1);
2168       if (TARGET_ARCH32)
2169         {
2170           wordpart[2][0] = gen_rtx (REG, word_mode, REGNO (op0) + 2);
2171           wordpart[3][0] = gen_rtx (REG, word_mode, REGNO (op0) + 3);
2172         }
2173     }
2174   else if (optype0 == OFFSOP)
2175     {
2176       wordpart[0][0] = adj_offsettable_operand (op0, 0);
2177       if (TARGET_ARCH32)
2178         {
2179           wordpart[1][0] = adj_offsettable_operand (op0, 4);
2180           wordpart[2][0] = adj_offsettable_operand (op0, 8);
2181           wordpart[3][0] = adj_offsettable_operand (op0, 12);
2182         }
2183       else
2184         wordpart[1][0] = adj_offsettable_operand (op0, 8);
2185     }
2186   else
2187     {
2188       wordpart[0][0] = op0;
2189       wordpart[1][0] = op0;
2190       wordpart[2][0] = op0;
2191       wordpart[3][0] = op0;
2192     }
2193
2194   if (optype1 == REGOP)
2195     {
2196       wordpart[0][1] = gen_rtx (REG, word_mode, REGNO (op1) + 0);
2197       wordpart[1][1] = gen_rtx (REG, word_mode, REGNO (op1) + 1);
2198       if (TARGET_ARCH32)
2199         {
2200           wordpart[2][1] = gen_rtx (REG, word_mode, REGNO (op1) + 2);
2201           wordpart[3][1] = gen_rtx (REG, word_mode, REGNO (op1) + 3);
2202         }
2203     }
2204   else if (optype1 == OFFSOP)
2205     {
2206       wordpart[0][1] = adj_offsettable_operand (op1, 0);
2207       if (TARGET_ARCH32)
2208         {
2209           wordpart[1][1] = adj_offsettable_operand (op1, 4);
2210           wordpart[2][1] = adj_offsettable_operand (op1, 8);
2211           wordpart[3][1] = adj_offsettable_operand (op1, 12);
2212         }
2213       else
2214         wordpart[1][1] = adj_offsettable_operand (op1, 8);
2215     }
2216   else if (optype1 == CNSTOP)
2217     {
2218       REAL_VALUE_TYPE r;
2219       long l[4];
2220
2221       /* This only works for TFmode floating point constants.  */
2222       if (GET_CODE (op1) != CONST_DOUBLE || GET_MODE (op1) != TFmode)
2223         abort ();
2224
2225       REAL_VALUE_FROM_CONST_DOUBLE (r, op1);
2226       REAL_VALUE_TO_TARGET_LONG_DOUBLE (r, l);
2227
2228       wordpart[0][1] = GEN_INT (l[0]);
2229       wordpart[1][1] = GEN_INT (l[1]);
2230       wordpart[2][1] = GEN_INT (l[2]);
2231       wordpart[3][1] = GEN_INT (l[3]);
2232     }
2233   else
2234     {
2235       wordpart[0][1] = op1;
2236       wordpart[1][1] = op1;
2237       wordpart[2][1] = op1;
2238       wordpart[3][1] = op1;
2239     }
2240
2241   /* Easy case: try moving the quad as two pairs.  Check for moving between
2242      an even/odd register pair and a memory location.
2243      Also handle new v9 fp regs here.  */
2244   /* ??? Should also handle the case of non-offsettable addresses here.
2245      We can at least do the first pair as a ldd/std, and then do the third
2246      and fourth words individually.  */
2247   if ((optype0 == REGOP && optype1 == OFFSOP && (REGNO (op0) & 1) == 0)
2248       || (optype0 == OFFSOP && optype1 == REGOP && (REGNO (op1) & 1) == 0))
2249     {
2250       rtx mem, reg;
2251
2252       if (optype0 == REGOP)
2253         mem = op1, reg = op0;
2254       else
2255         mem = op0, reg = op1;
2256
2257       if (mem_aligned_8 (mem)
2258           /* If this is a floating point register higher than %f31,
2259              then we *must* use an aligned load, since `ld' will not accept
2260              the register number.  */
2261           || (TARGET_V9 && REGNO (reg) >= SPARC_FIRST_V9_FP_REG))
2262         {
2263           if (TARGET_V9 && FP_REG_P (reg) && TARGET_HARD_QUAD)
2264             {
2265               if ((REGNO (reg) & 3) != 0)
2266                 abort ();
2267               /* ??? Can `mem' have an inappropriate alignment here?  */
2268               return (mem == op1 ? "ldq %1,%0" : "stq %1,%0");
2269             }
2270           operands[2] = adj_offsettable_operand (mem, 8);
2271           /* ??? In arch64 case, shouldn't we use ldd/std for fp regs.  */
2272           if (mem == op1)
2273             return TARGET_ARCH64 ? "ldx %1,%0;ldx %2,%R0" : "ldd %1,%0;ldd %2,%S0";
2274           else
2275             return TARGET_ARCH64 ? "stx %1,%0;stx %R1,%2" : "std %1,%0;std %S1,%2";
2276         }
2277     }
2278
2279   /* If the first move would clobber the source of the second one,
2280      do them in the other order.  */
2281
2282   /* Overlapping registers?  */
2283   if (TARGET_ARCH32)
2284     {
2285       if (optype0 == REGOP && optype1 == REGOP
2286           && (REGNO (op0) == REGNO (wordpart[1][3])
2287               || REGNO (op0) == REGNO (wordpart[1][2])
2288               || REGNO (op0) == REGNO (wordpart[1][1])))
2289         {
2290           /* Do fourth word.  */
2291           output_asm_insn (singlemove_string (wordpart[3]), wordpart[3]);
2292           /* Do the third word.  */
2293           output_asm_insn (singlemove_string (wordpart[2]), wordpart[2]);
2294           /* Do the second word.  */
2295           output_asm_insn (singlemove_string (wordpart[1]), wordpart[1]);
2296           /* Do lowest-numbered word.  */
2297           output_asm_insn (singlemove_string (wordpart[0]), wordpart[0]);
2298           return "";
2299         }
2300     }
2301   else /* TARGET_ARCH64 */
2302     {
2303       if (optype0 == REGOP && optype1 == REGOP
2304           && REGNO (op0) == REGNO (wordpart[1][1]))
2305         {
2306           output_asm_insn ("mov %1,%0", wordpart[1]);
2307           output_asm_insn ("mov %1,%0", wordpart[0]);
2308           return "";
2309         }
2310     }
2311
2312   /* Loading into a register which overlaps a register used in the address.  */
2313   if (optype0 == REGOP && optype1 != REGOP
2314       && reg_overlap_mentioned_p (op0, op1))
2315     {
2316       /* ??? Not implemented yet.  This is a bit complicated, because we
2317          must load which ever part overlaps the address last.  If the address
2318          is a double-reg address, then there are two parts which need to
2319          be done last, which is impossible.  We would need a scratch register
2320          in that case.  */
2321       abort ();
2322     }
2323
2324   /* Normal case: move the words in lowest to highest address order.  */
2325
2326   if (TARGET_ARCH32)
2327     {
2328       output_asm_insn (singlemove_string (wordpart[0]), wordpart[0]);
2329
2330       /* Make any unoffsettable addresses point at the second word.  */
2331       if (addreg0)
2332         output_asm_insn ("add %0,0x4,%0", &addreg0);
2333       if (addreg1)
2334         output_asm_insn ("add %0,0x4,%0", &addreg1);
2335
2336       /* Do the second word.  */
2337       output_asm_insn (singlemove_string (wordpart[1]), wordpart[1]);
2338
2339       /* Make any unoffsettable addresses point at the third word.  */
2340       if (addreg0)
2341         output_asm_insn ("add %0,0x4,%0", &addreg0);
2342       if (addreg1)
2343         output_asm_insn ("add %0,0x4,%0", &addreg1);
2344
2345       /* Do the third word.  */
2346       output_asm_insn (singlemove_string (wordpart[2]), wordpart[2]);
2347
2348       /* Make any unoffsettable addresses point at the fourth word.  */
2349       if (addreg0)
2350         output_asm_insn ("add %0,0x4,%0", &addreg0);
2351       if (addreg1)
2352         output_asm_insn ("add %0,0x4,%0", &addreg1);
2353
2354       /* Do the fourth word.  */
2355       output_asm_insn (singlemove_string (wordpart[3]), wordpart[3]);
2356
2357       /* Undo the adds we just did.  */
2358       if (addreg0)
2359         output_asm_insn ("add %0,-0xc,%0", &addreg0);
2360       if (addreg1)
2361         output_asm_insn ("add %0,-0xc,%0", &addreg1);
2362     }
2363   else /* TARGET_ARCH64 */
2364     {
2365       output_asm_insn (doublemove_string (wordpart[0]), wordpart[0]);
2366
2367       /* Make any unoffsettable addresses point at the second word.  */
2368       if (addreg0)
2369         output_asm_insn ("add %0,0x8,%0", &addreg0);
2370       if (addreg1)
2371         output_asm_insn ("add %0,0x8,%0", &addreg1);
2372
2373       /* Do the second word.  */
2374       output_asm_insn (doublemove_string (wordpart[1]), wordpart[1]);
2375
2376       /* Undo the adds we just did.  */
2377       if (addreg0)
2378         output_asm_insn ("add %0,-0x8,%0", &addreg0);
2379       if (addreg1)
2380         output_asm_insn ("add %0,-0x8,%0", &addreg1);
2381     }
2382
2383   return "";
2384 }
2385 \f
2386 /* Output assembler code to perform a doubleword move insn with operands
2387    OPERANDS, one of which must be a floating point register.  */
2388
2389 char *
2390 output_fp_move_double (operands)
2391      rtx *operands;
2392 {
2393   if (FP_REG_P (operands[0]))
2394     {
2395       if (FP_REG_P (operands[1]))
2396         {
2397           if (TARGET_V9)
2398             return "fmovd %1,%0";
2399           else
2400             return "fmovs %1,%0\n\tfmovs %R1,%R0";
2401         }
2402       else if (GET_CODE (operands[1]) == REG)
2403         abort ();
2404       else
2405         return output_move_double (operands);
2406     }
2407   else if (FP_REG_P (operands[1]))
2408     {
2409       if (GET_CODE (operands[0]) == REG)
2410         abort ();
2411       else
2412         return output_move_double (operands);
2413     }
2414   else abort ();
2415 }
2416
2417 /* Output assembler code to perform a quadword move insn with operands
2418    OPERANDS, one of which must be a floating point register.  */
2419
2420 char *
2421 output_fp_move_quad (operands)
2422      rtx *operands;
2423 {
2424   register rtx op0 = operands[0];
2425   register rtx op1 = operands[1];
2426
2427   if (FP_REG_P (op0))
2428     {
2429       if (FP_REG_P (op1))
2430         {
2431           if (TARGET_V9 && TARGET_HARD_QUAD)
2432             return "fmovq %1,%0";
2433           else if (TARGET_V9)
2434             return "fmovd %1,%0\n\tfmovd %S1,%S0";
2435           else
2436             return "fmovs %1,%0\n\tfmovs %R1,%R0\n\tfmovs %S1,%S0\n\tfmovs %T1,%T0";
2437         }
2438       else if (GET_CODE (op1) == REG)
2439         abort ();
2440       else
2441         return output_move_quad (operands);
2442     }
2443   else if (FP_REG_P (op1))
2444     {
2445       if (GET_CODE (op0) == REG)
2446         abort ();
2447       else
2448         return output_move_quad (operands);
2449     }
2450   else
2451     abort ();
2452 }
2453 \f
2454 /* Return a REG that occurs in ADDR with coefficient 1.
2455    ADDR can be effectively incremented by incrementing REG.  */
2456
2457 static rtx
2458 find_addr_reg (addr)
2459      rtx addr;
2460 {
2461   while (GET_CODE (addr) == PLUS)
2462     {
2463       /* We absolutely can not fudge the frame pointer here, because the
2464          frame pointer must always be 8 byte aligned.  It also confuses
2465          debuggers.  */
2466       if (GET_CODE (XEXP (addr, 0)) == REG
2467           && REGNO (XEXP (addr, 0)) != FRAME_POINTER_REGNUM)
2468         addr = XEXP (addr, 0);
2469       else if (GET_CODE (XEXP (addr, 1)) == REG
2470                && REGNO (XEXP (addr, 1)) != FRAME_POINTER_REGNUM)
2471         addr = XEXP (addr, 1);
2472       else if (CONSTANT_P (XEXP (addr, 0)))
2473         addr = XEXP (addr, 1);
2474       else if (CONSTANT_P (XEXP (addr, 1)))
2475         addr = XEXP (addr, 0);
2476       else
2477         abort ();
2478     }
2479   if (GET_CODE (addr) == REG)
2480     return addr;
2481   abort ();
2482 }
2483
2484 #if 0 /* not currently used */
2485
2486 void
2487 output_sized_memop (opname, mode, signedp)
2488      char *opname;
2489      enum machine_mode mode;
2490      int signedp;
2491 {
2492   static char *ld_size_suffix_u[] = { "ub", "uh", "", "?", "d" };
2493   static char *ld_size_suffix_s[] = { "sb", "sh", "", "?", "d" };
2494   static char *st_size_suffix[] = { "b", "h", "", "?", "d" };
2495   char **opnametab, *modename;
2496
2497   if (opname[0] == 'l')
2498     if (signedp)
2499       opnametab = ld_size_suffix_s;
2500     else
2501       opnametab = ld_size_suffix_u;
2502   else
2503     opnametab = st_size_suffix;
2504   modename = opnametab[GET_MODE_SIZE (mode) >> 1];
2505
2506   fprintf (asm_out_file, "\t%s%s", opname, modename);
2507 }
2508
2509 void
2510 output_move_with_extension (operands)
2511      rtx *operands;
2512 {
2513   if (GET_MODE (operands[2]) == HImode)
2514     output_asm_insn ("sll %2,0x10,%0", operands);
2515   else if (GET_MODE (operands[2]) == QImode)
2516     output_asm_insn ("sll %2,0x18,%0", operands);
2517   else
2518     abort ();
2519 }
2520 #endif /* not currently used */
2521 \f
2522 #if 0
2523 /* ??? These are only used by the movstrsi pattern, but we get better code
2524    in general without that, because emit_block_move can do just as good a
2525    job as this function does when alignment and size are known.  When they
2526    aren't known, a call to strcpy may be faster anyways, because it is
2527    likely to be carefully crafted assembly language code, and below we just
2528    do a byte-wise copy.
2529
2530    Also, emit_block_move expands into multiple read/write RTL insns, which
2531    can then be optimized, whereas our movstrsi pattern can not be optimized
2532    at all.  */
2533
2534 /* Load the address specified by OPERANDS[3] into the register
2535    specified by OPERANDS[0].
2536
2537    OPERANDS[3] may be the result of a sum, hence it could either be:
2538
2539    (1) CONST
2540    (2) REG
2541    (2) REG + CONST_INT
2542    (3) REG + REG + CONST_INT
2543    (4) REG + REG  (special case of 3).
2544
2545    Note that (3) is not a legitimate address.
2546    All cases are handled here.  */
2547
2548 void
2549 output_load_address (operands)
2550      rtx *operands;
2551 {
2552   rtx base, offset;
2553
2554   if (CONSTANT_P (operands[3]))
2555     {
2556       output_asm_insn ("set %3,%0", operands);
2557       return;
2558     }
2559
2560   if (REG_P (operands[3]))
2561     {
2562       if (REGNO (operands[0]) != REGNO (operands[3]))
2563         output_asm_insn ("mov %3,%0", operands);
2564       return;
2565     }
2566
2567   if (GET_CODE (operands[3]) != PLUS)
2568     abort ();
2569
2570   base = XEXP (operands[3], 0);
2571   offset = XEXP (operands[3], 1);
2572
2573   if (GET_CODE (base) == CONST_INT)
2574     {
2575       rtx tmp = base;
2576       base = offset;
2577       offset = tmp;
2578     }
2579
2580   if (GET_CODE (offset) != CONST_INT)
2581     {
2582       /* Operand is (PLUS (REG) (REG)).  */
2583       base = operands[3];
2584       offset = const0_rtx;
2585     }
2586
2587   if (REG_P (base))
2588     {
2589       operands[6] = base;
2590       operands[7] = offset;
2591       if (SMALL_INT (offset))
2592         output_asm_insn ("add %6,%7,%0", operands);
2593       else
2594         output_asm_insn ("set %7,%0\n\tadd %0,%6,%0", operands);
2595     }
2596   else if (GET_CODE (base) == PLUS)
2597     {
2598       operands[6] = XEXP (base, 0);
2599       operands[7] = XEXP (base, 1);
2600       operands[8] = offset;
2601
2602       if (SMALL_INT (offset))
2603         output_asm_insn ("add %6,%7,%0\n\tadd %0,%8,%0", operands);
2604       else
2605         output_asm_insn ("set %8,%0\n\tadd %0,%6,%0\n\tadd %0,%7,%0", operands);
2606     }
2607   else
2608     abort ();
2609 }
2610
2611 /* Output code to place a size count SIZE in register REG.
2612    ALIGN is the size of the unit of transfer.
2613
2614    Because block moves are pipelined, we don't include the
2615    first element in the transfer of SIZE to REG.  */
2616
2617 static void
2618 output_size_for_block_move (size, reg, align)
2619      rtx size, reg;
2620      rtx align;
2621 {
2622   rtx xoperands[3];
2623
2624   xoperands[0] = reg;
2625   xoperands[1] = size;
2626   xoperands[2] = align;
2627   if (GET_CODE (size) == REG)
2628     output_asm_insn ("sub %1,%2,%0", xoperands);
2629   else
2630     {
2631       xoperands[1]
2632         = gen_rtx (CONST_INT, VOIDmode, INTVAL (size) - INTVAL (align));
2633       output_asm_insn ("set %1,%0", xoperands);
2634     }
2635 }
2636
2637 /* Emit code to perform a block move.
2638
2639    OPERANDS[0] is the destination.
2640    OPERANDS[1] is the source.
2641    OPERANDS[2] is the size.
2642    OPERANDS[3] is the alignment safe to use.
2643    OPERANDS[4] is a register we can safely clobber as a temp.  */
2644
2645 char *
2646 output_block_move (operands)
2647      rtx *operands;
2648 {
2649   /* A vector for our computed operands.  Note that load_output_address
2650      makes use of (and can clobber) up to the 8th element of this vector.  */
2651   rtx xoperands[10];
2652   rtx zoperands[10];
2653   static int movstrsi_label = 0;
2654   int i;
2655   rtx temp1 = operands[4];
2656   rtx sizertx = operands[2];
2657   rtx alignrtx = operands[3];
2658   int align = INTVAL (alignrtx);
2659   char label3[30], label5[30];
2660
2661   xoperands[0] = operands[0];
2662   xoperands[1] = operands[1];
2663   xoperands[2] = temp1;
2664
2665   /* We can't move more than this many bytes at a time because we have only
2666      one register, %g1, to move them through.  */
2667   if (align > UNITS_PER_WORD)
2668     {
2669       align = UNITS_PER_WORD;
2670       alignrtx = gen_rtx (CONST_INT, VOIDmode, UNITS_PER_WORD);
2671     }
2672
2673   /* We consider 8 ld/st pairs, for a total of 16 inline insns to be
2674      reasonable here.  (Actually will emit a maximum of 18 inline insns for
2675      the case of size == 31 and align == 4).  */
2676
2677   if (GET_CODE (sizertx) == CONST_INT && (INTVAL (sizertx) / align) <= 8
2678       && memory_address_p (QImode, plus_constant_for_output (xoperands[0],
2679                                                              INTVAL (sizertx)))
2680       && memory_address_p (QImode, plus_constant_for_output (xoperands[1],
2681                                                              INTVAL (sizertx))))
2682     {
2683       int size = INTVAL (sizertx);
2684       int offset = 0;
2685
2686       /* We will store different integers into this particular RTX.  */
2687       xoperands[2] = rtx_alloc (CONST_INT);
2688       PUT_MODE (xoperands[2], VOIDmode);
2689
2690       /* This case is currently not handled.  Abort instead of generating
2691          bad code.  */
2692       if (align > UNITS_PER_WORD)
2693         abort ();
2694
2695       if (TARGET_ARCH64 && align >= 8)
2696         {
2697           for (i = (size >> 3) - 1; i >= 0; i--)
2698             {
2699               INTVAL (xoperands[2]) = (i << 3) + offset;
2700               output_asm_insn ("ldx [%a1+%2],%%g1\n\tstx %%g1,[%a0+%2]",
2701                                xoperands);
2702             }
2703           offset += (size & ~0x7);
2704           size = size & 0x7;
2705           if (size == 0)
2706             return "";
2707         }
2708
2709       if (align >= 4)
2710         {
2711           for (i = (size >> 2) - 1; i >= 0; i--)
2712             {
2713               INTVAL (xoperands[2]) = (i << 2) + offset;
2714               output_asm_insn ("ld [%a1+%2],%%g1\n\tst %%g1,[%a0+%2]",
2715                                xoperands);
2716             }
2717           offset += (size & ~0x3);
2718           size = size & 0x3;
2719           if (size == 0)
2720             return "";
2721         }
2722
2723       if (align >= 2)
2724         {
2725           for (i = (size >> 1) - 1; i >= 0; i--)
2726             {
2727               INTVAL (xoperands[2]) = (i << 1) + offset;
2728               output_asm_insn ("lduh [%a1+%2],%%g1\n\tsth %%g1,[%a0+%2]",
2729                                xoperands);
2730             }
2731           offset += (size & ~0x1);
2732           size = size & 0x1;
2733           if (size == 0)
2734             return "";
2735         }
2736
2737       if (align >= 1)
2738         {
2739           for (i = size - 1; i >= 0; i--)
2740             {
2741               INTVAL (xoperands[2]) = i + offset;
2742               output_asm_insn ("ldub [%a1+%2],%%g1\n\tstb %%g1,[%a0+%2]",
2743                                xoperands);
2744             }
2745           return "";
2746         }
2747
2748       /* We should never reach here.  */
2749       abort ();
2750     }
2751
2752   /* If the size isn't known to be a multiple of the alignment,
2753      we have to do it in smaller pieces.  If we could determine that
2754      the size was a multiple of 2 (or whatever), we could be smarter
2755      about this.  */
2756   if (GET_CODE (sizertx) != CONST_INT)
2757     align = 1;
2758   else
2759     {
2760       int size = INTVAL (sizertx);
2761       while (size % align)
2762         align >>= 1;
2763     }
2764
2765   if (align != INTVAL (alignrtx))
2766     alignrtx = gen_rtx (CONST_INT, VOIDmode, align);
2767
2768   xoperands[3] = gen_rtx (CONST_INT, VOIDmode, movstrsi_label++);
2769   xoperands[4] = gen_rtx (CONST_INT, VOIDmode, align);
2770   xoperands[5] = gen_rtx (CONST_INT, VOIDmode, movstrsi_label++);
2771
2772   ASM_GENERATE_INTERNAL_LABEL (label3, "Lm", INTVAL (xoperands[3]));
2773   ASM_GENERATE_INTERNAL_LABEL (label5, "Lm", INTVAL (xoperands[5]));
2774
2775   /* This is the size of the transfer.  Emit code to decrement the size
2776      value by ALIGN, and store the result in the temp1 register.  */
2777   output_size_for_block_move (sizertx, temp1, alignrtx);
2778
2779   /* Must handle the case when the size is zero or negative, so the first thing
2780      we do is compare the size against zero, and only copy bytes if it is
2781      zero or greater.  Note that we have already subtracted off the alignment
2782      once, so we must copy 1 alignment worth of bytes if the size is zero
2783      here.
2784
2785      The SUN assembler complains about labels in branch delay slots, so we
2786      do this before outputting the load address, so that there will always
2787      be a harmless insn between the branch here and the next label emitted
2788      below.  */
2789
2790   {
2791     char pattern[100];
2792
2793     sprintf (pattern, "cmp %%2,0\n\tbl %s", &label5[1]);
2794     output_asm_insn (pattern, xoperands);
2795   }
2796
2797   zoperands[0] = operands[0];
2798   zoperands[3] = plus_constant_for_output (operands[0], align);
2799   output_load_address (zoperands);
2800
2801   /* ??? This might be much faster if the loops below were preconditioned
2802      and unrolled.
2803
2804      That is, at run time, copy enough bytes one at a time to ensure that the
2805      target and source addresses are aligned to the the largest possible
2806      alignment.  Then use a preconditioned unrolled loop to copy say 16
2807      bytes at a time.  Then copy bytes one at a time until finish the rest.  */
2808
2809   /* Output the first label separately, so that it is spaced properly.  */
2810
2811   ASM_OUTPUT_INTERNAL_LABEL (asm_out_file, "Lm", INTVAL (xoperands[3]));
2812
2813   {
2814     char pattern[200];
2815     register char *ld_suffix = ((align == 1) ? "ub" : (align == 2) ? "uh"
2816                                 : (align == 8 && TARGET_ARCH64) ? "x" : "");
2817     register char *st_suffix = ((align == 1) ? "b" : (align == 2) ? "h"
2818                                 : (align == 8 && TARGET_ARCH64) ? "x" : "");
2819
2820     sprintf (pattern, "ld%s [%%1+%%2],%%%%g1\n\tsubcc %%2,%%4,%%2\n\tbge %s\n\tst%s %%%%g1,[%%0+%%2]\n%s:", ld_suffix, &label3[1], st_suffix, &label5[1]);
2821     output_asm_insn (pattern, xoperands);
2822   }
2823
2824   return "";
2825 }
2826 #endif
2827 \f
2828 /* Output reasonable peephole for set-on-condition-code insns.
2829    Note that these insns assume a particular way of defining
2830    labels.  Therefore, *both* sparc.h and this function must
2831    be changed if a new syntax is needed.    */
2832
2833 char *
2834 output_scc_insn (operands, insn)
2835      rtx operands[];
2836      rtx insn;
2837 {
2838   static char string[100];
2839   rtx label = 0, next = insn;
2840   int need_label = 0;
2841
2842   /* Try doing a jump optimization which jump.c can't do for us
2843      because we did not expose that setcc works by using branches.
2844
2845      If this scc insn is followed by an unconditional branch, then have
2846      the jump insn emitted here jump to that location, instead of to
2847      the end of the scc sequence as usual.  */
2848
2849   do
2850     {
2851       if (GET_CODE (next) == CODE_LABEL)
2852         label = next;
2853       next = NEXT_INSN (next);
2854       if (next == 0)
2855         break;
2856     }
2857   while (GET_CODE (next) == NOTE || GET_CODE (next) == CODE_LABEL);
2858
2859   /* If we are in a sequence, and the following insn is a sequence also,
2860      then just following the current insn's next field will take us to the
2861      first insn of the next sequence, which is the wrong place.  We don't
2862      want to optimize with a branch that has had its delay slot filled.
2863      Avoid this by verifying that NEXT_INSN (PREV_INSN (next)) == next
2864      which fails only if NEXT is such a branch.  */
2865
2866   if (next && GET_CODE (next) == JUMP_INSN && simplejump_p (next)
2867       && (! final_sequence || NEXT_INSN (PREV_INSN (next)) == next))
2868     label = JUMP_LABEL (next);
2869   /* If not optimizing, jump label fields are not set.  To be safe, always
2870      check here to whether label is still zero.  */
2871   if (label == 0)
2872     {
2873       label = gen_label_rtx ();
2874       need_label = 1;
2875     }
2876
2877   LABEL_NUSES (label) += 1;
2878
2879   /* operands[3] is an unused slot.  */
2880   operands[3] = label;
2881
2882   /* If we are in a delay slot, assume it is the delay slot of an fpcc
2883      insn since our type isn't allowed anywhere else.  */
2884
2885   /* ??? Fpcc instructions no longer have delay slots, so this code is
2886      probably obsolete.  */
2887
2888   /* The fastest way to emit code for this is an annulled branch followed
2889      by two move insns.  This will take two cycles if the branch is taken,
2890      and three cycles if the branch is not taken.
2891
2892      However, if we are in the delay slot of another branch, this won't work,
2893      because we can't put a branch in the delay slot of another branch.
2894      The above sequence would effectively take 3 or 4 cycles respectively
2895      since a no op would have be inserted between the two branches.
2896      In this case, we want to emit a move, annulled branch, and then the
2897      second move.  This sequence always takes 3 cycles, and hence is faster
2898      when we are in a branch delay slot.  */
2899
2900   if (final_sequence)
2901     {
2902       strcpy (string, "mov 0,%0\n\t");
2903       strcat (string, output_cbranch (operands[2], 3, 0, 1, 0));
2904       strcat (string, "\n\tmov 1,%0");
2905     }
2906   else
2907     {
2908       strcpy (string, output_cbranch (operands[2], 3, 0, 1, 0));
2909       strcat (string, "\n\tmov 1,%0\n\tmov 0,%0");
2910     }
2911
2912   if (need_label)
2913     strcat (string, "\n%l3:");
2914
2915   return string;
2916 }
2917 \f
2918 /* Vectors to keep interesting information about registers where it can easily
2919    be got.  We use to use the actual mode value as the bit number, but there
2920    are more than 32 modes now.  Instead we use two tables: one indexed by
2921    hard register number, and one indexed by mode.  */
2922
2923 /* The purpose of sparc_mode_class is to shrink the range of modes so that
2924    they all fit (as bit numbers) in a 32 bit word (again).  Each real mode is
2925    mapped into one sparc_mode_class mode.  */
2926
2927 enum sparc_mode_class {
2928   S_MODE, D_MODE, T_MODE, O_MODE,
2929   SF_MODE, DF_MODE, TF_MODE, OF_MODE,
2930   CC_MODE, CCFP_MODE
2931 };
2932
2933 /* Modes for single-word and smaller quantities.  */
2934 #define S_MODES ((1 << (int) S_MODE) | (1 << (int) SF_MODE))
2935
2936 /* Modes for double-word and smaller quantities.  */
2937 #define D_MODES (S_MODES | (1 << (int) D_MODE) | (1 << DF_MODE))
2938
2939 /* Modes for quad-word and smaller quantities.  */
2940 #define T_MODES (D_MODES | (1 << (int) T_MODE) | (1 << (int) TF_MODE))
2941
2942 /* Modes for single-float quantities.  We must allow any single word or
2943    smaller quantity.  This is because the fix/float conversion instructions
2944    take integer inputs/outputs from the float registers.  */
2945 #define SF_MODES (S_MODES)
2946
2947 /* Modes for double-float and smaller quantities.  */
2948 #define DF_MODES (S_MODES | D_MODES)
2949
2950 /* ??? Sparc64 fp regs cannot hold DImode values.  */
2951 #define DF_MODES64 (SF_MODES | DF_MODE /* | D_MODE*/)
2952
2953 /* Modes for double-float only quantities.  */
2954 /* ??? Sparc64 fp regs cannot hold DImode values.
2955    See fix_truncsfdi2.  */
2956 #define DF_ONLY_MODES ((1 << (int) DF_MODE) /*| (1 << (int) D_MODE)*/)
2957
2958 /* Modes for double-float and larger quantities.  */
2959 #define DF_UP_MODES (DF_ONLY_MODES | TF_ONLY_MODES)
2960
2961 /* Modes for quad-float only quantities.  */
2962 #define TF_ONLY_MODES (1 << (int) TF_MODE)
2963
2964 /* Modes for quad-float and smaller quantities.  */
2965 #define TF_MODES (DF_MODES | TF_ONLY_MODES)
2966
2967 /* ??? Sparc64 fp regs cannot hold DImode values.
2968    See fix_truncsfdi2.  */
2969 #define TF_MODES64 (DF_MODES64 | TF_ONLY_MODES)
2970
2971 /* Modes for condition codes.  */
2972 #define CC_MODES (1 << (int) CC_MODE)
2973 #define CCFP_MODES (1 << (int) CCFP_MODE)
2974
2975 /* Value is 1 if register/mode pair is acceptable on sparc.
2976    The funny mixture of D and T modes is because integer operations
2977    do not specially operate on tetra quantities, so non-quad-aligned
2978    registers can hold quadword quantities (except %o4 and %i4 because
2979    they cross fixed registers).  */
2980
2981 /* This points to either the 32 bit or the 64 bit version.  */
2982 int *hard_regno_mode_classes;
2983
2984 static int hard_32bit_mode_classes[] = {
2985   S_MODES, S_MODES, T_MODES, S_MODES, T_MODES, S_MODES, D_MODES, S_MODES,
2986   T_MODES, S_MODES, T_MODES, S_MODES, D_MODES, S_MODES, D_MODES, S_MODES,
2987   T_MODES, S_MODES, T_MODES, S_MODES, T_MODES, S_MODES, D_MODES, S_MODES,
2988   T_MODES, S_MODES, T_MODES, S_MODES, D_MODES, S_MODES, D_MODES, S_MODES,
2989
2990   TF_MODES, SF_MODES, DF_MODES, SF_MODES, TF_MODES, SF_MODES, DF_MODES, SF_MODES,
2991   TF_MODES, SF_MODES, DF_MODES, SF_MODES, TF_MODES, SF_MODES, DF_MODES, SF_MODES,
2992   TF_MODES, SF_MODES, DF_MODES, SF_MODES, TF_MODES, SF_MODES, DF_MODES, SF_MODES,
2993   TF_MODES, SF_MODES, DF_MODES, SF_MODES, TF_MODES, SF_MODES, DF_MODES, SF_MODES,
2994
2995   /* FP regs f32 to f63.  Only the even numbered registers actually exist,
2996      and none can hold SFmode/SImode values.  */
2997   DF_UP_MODES, 0, DF_ONLY_MODES, 0, DF_UP_MODES, 0, DF_ONLY_MODES, 0,
2998   DF_UP_MODES, 0, DF_ONLY_MODES, 0, DF_UP_MODES, 0, DF_ONLY_MODES, 0,
2999   DF_UP_MODES, 0, DF_ONLY_MODES, 0, DF_UP_MODES, 0, DF_ONLY_MODES, 0,
3000   DF_UP_MODES, 0, DF_ONLY_MODES, 0, DF_UP_MODES, 0, DF_ONLY_MODES, 0,
3001
3002   /* %fcc[0123] */
3003   CCFP_MODES, CCFP_MODES, CCFP_MODES, CCFP_MODES,
3004
3005   /* %icc */
3006   CC_MODES
3007 };
3008
3009 static int hard_64bit_mode_classes[] = {
3010   D_MODES, D_MODES, T_MODES, D_MODES, T_MODES, D_MODES, T_MODES, D_MODES,
3011   T_MODES, D_MODES, T_MODES, D_MODES, T_MODES, D_MODES, T_MODES, D_MODES,
3012   T_MODES, D_MODES, T_MODES, D_MODES, T_MODES, D_MODES, T_MODES, D_MODES,
3013   T_MODES, D_MODES, T_MODES, D_MODES, T_MODES, D_MODES, T_MODES, D_MODES,
3014
3015   TF_MODES64, SF_MODES, DF_MODES64, SF_MODES, TF_MODES64, SF_MODES, DF_MODES64, SF_MODES,
3016   TF_MODES64, SF_MODES, DF_MODES64, SF_MODES, TF_MODES64, SF_MODES, DF_MODES64, SF_MODES,
3017   TF_MODES64, SF_MODES, DF_MODES64, SF_MODES, TF_MODES64, SF_MODES, DF_MODES64, SF_MODES,
3018   TF_MODES64, SF_MODES, DF_MODES64, SF_MODES, TF_MODES64, SF_MODES, DF_MODES64, SF_MODES,
3019
3020   /* FP regs f32 to f63.  Only the even numbered registers actually exist,
3021      and none can hold SFmode/SImode values.  */
3022   DF_UP_MODES, 0, DF_ONLY_MODES, 0, DF_UP_MODES, 0, DF_ONLY_MODES, 0,
3023   DF_UP_MODES, 0, DF_ONLY_MODES, 0, DF_UP_MODES, 0, DF_ONLY_MODES, 0,
3024   DF_UP_MODES, 0, DF_ONLY_MODES, 0, DF_UP_MODES, 0, DF_ONLY_MODES, 0,
3025   DF_UP_MODES, 0, DF_ONLY_MODES, 0, DF_UP_MODES, 0, DF_ONLY_MODES, 0,
3026
3027   /* %fcc[0123] */
3028   CCFP_MODES, CCFP_MODES, CCFP_MODES, CCFP_MODES,
3029
3030   /* %icc */
3031   CC_MODES
3032 };
3033
3034 int sparc_mode_class [NUM_MACHINE_MODES];
3035
3036 enum reg_class sparc_regno_reg_class[FIRST_PSEUDO_REGISTER];
3037
3038 static void
3039 sparc_init_modes ()
3040 {
3041   int i;
3042
3043   for (i = 0; i < NUM_MACHINE_MODES; i++)
3044     {
3045       switch (GET_MODE_CLASS (i))
3046         {
3047         case MODE_INT:
3048         case MODE_PARTIAL_INT:
3049         case MODE_COMPLEX_INT:
3050           if (GET_MODE_SIZE (i) <= 4)
3051             sparc_mode_class[i] = 1 << (int) S_MODE;
3052           else if (GET_MODE_SIZE (i) == 8)
3053             sparc_mode_class[i] = 1 << (int) D_MODE;
3054           else if (GET_MODE_SIZE (i) == 16)
3055             sparc_mode_class[i] = 1 << (int) T_MODE;
3056           else if (GET_MODE_SIZE (i) == 32)
3057             sparc_mode_class[i] = 1 << (int) O_MODE;
3058           else
3059             sparc_mode_class[i] = 0;
3060           break;
3061         case MODE_FLOAT:
3062         case MODE_COMPLEX_FLOAT:
3063           if (GET_MODE_SIZE (i) <= 4)
3064             sparc_mode_class[i] = 1 << (int) SF_MODE;
3065           else if (GET_MODE_SIZE (i) == 8)
3066             sparc_mode_class[i] = 1 << (int) DF_MODE;
3067           else if (GET_MODE_SIZE (i) == 16)
3068             sparc_mode_class[i] = 1 << (int) TF_MODE;
3069           else if (GET_MODE_SIZE (i) == 32)
3070             sparc_mode_class[i] = 1 << (int) OF_MODE;
3071           else
3072             sparc_mode_class[i] = 0;
3073           break;
3074         case MODE_CC:
3075         default:
3076           /* mode_class hasn't been initialized yet for EXTRA_CC_MODES, so
3077              we must explicitly check for them here.  */
3078           if (i == (int) CCFPmode || i == (int) CCFPEmode)
3079             sparc_mode_class[i] = 1 << (int) CCFP_MODE;
3080           else if (i == (int) CCmode || i == (int) CC_NOOVmode
3081                    || i == (int) CCXmode || i == (int) CCX_NOOVmode)
3082             sparc_mode_class[i] = 1 << (int) CC_MODE;
3083           else
3084             sparc_mode_class[i] = 0;
3085           break;
3086         }
3087     }
3088
3089   if (TARGET_ARCH64)
3090     hard_regno_mode_classes = hard_64bit_mode_classes;
3091   else
3092     hard_regno_mode_classes = hard_32bit_mode_classes;
3093
3094   /* Initialize the array used by REGNO_REG_CLASS.  */
3095   for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
3096     {
3097       if (i < 32)
3098         sparc_regno_reg_class[i] = GENERAL_REGS;
3099       else if (i < 64)
3100         sparc_regno_reg_class[i] = FP_REGS;
3101       else if (i < 96)
3102         sparc_regno_reg_class[i] = EXTRA_FP_REGS;
3103       else if (i < 100)
3104         sparc_regno_reg_class[i] = FPCC_REGS;
3105       else
3106         sparc_regno_reg_class[i] = NO_REGS;
3107     }
3108 }
3109 \f
3110 /* Save non call used registers from LOW to HIGH at BASE+OFFSET.
3111    N_REGS is the number of 4-byte regs saved thus far.  This applies even to
3112    v9 int regs as it simplifies the code.  */
3113
3114 static int
3115 save_regs (file, low, high, base, offset, n_regs, real_offset)
3116      FILE *file;
3117      int low, high;
3118      char *base;
3119      int offset;
3120      int n_regs;
3121      int real_offset;
3122 {
3123   int i;
3124
3125   if (TARGET_ARCH64 && high <= 32)
3126     {
3127       for (i = low; i < high; i++)
3128         {
3129           if (regs_ever_live[i] && ! call_used_regs[i])
3130             {
3131               fprintf (file, "\tstx %s,[%s+%d]\n",
3132                        reg_names[i], base, offset + 4 * n_regs);
3133               if (dwarf2out_do_frame ())
3134                 dwarf2out_reg_save ("", i, real_offset + 4 * n_regs);
3135               n_regs += 2;
3136             }
3137         }
3138     }
3139   else
3140     {
3141       for (i = low; i < high; i += 2)
3142         {
3143           if (regs_ever_live[i] && ! call_used_regs[i])
3144             if (regs_ever_live[i+1] && ! call_used_regs[i+1])
3145               {
3146                 fprintf (file, "\tstd %s,[%s+%d]\n",
3147                          reg_names[i], base, offset + 4 * n_regs);
3148                 if (dwarf2out_do_frame ())
3149                   {
3150                     char *l = dwarf2out_cfi_label ();
3151                     dwarf2out_reg_save (l, i, real_offset + 4 * n_regs);
3152                     dwarf2out_reg_save (l, i+1, real_offset + 4 * n_regs + 4);
3153                   }
3154                 n_regs += 2;
3155               }
3156             else
3157               {
3158                 fprintf (file, "\tst %s,[%s+%d]\n",
3159                          reg_names[i], base, offset + 4 * n_regs);
3160                 if (dwarf2out_do_frame ())
3161                   dwarf2out_reg_save ("", i, real_offset + 4 * n_regs);
3162                 n_regs += 2;
3163               }
3164           else if (regs_ever_live[i+1] && ! call_used_regs[i+1])
3165             {
3166               fprintf (file, "\tst %s,[%s+%d]\n",
3167                        reg_names[i+1], base, offset + 4 * n_regs + 4);
3168               if (dwarf2out_do_frame ())
3169                 dwarf2out_reg_save ("", i + 1, real_offset + 4 * n_regs + 4);
3170               n_regs += 2;
3171             }
3172         }
3173     }
3174   return n_regs;
3175 }
3176
3177 /* Restore non call used registers from LOW to HIGH at BASE+OFFSET.
3178
3179    N_REGS is the number of 4-byte regs saved thus far.  This applies even to
3180    v9 int regs as it simplifies the code.  */
3181
3182 static int
3183 restore_regs (file, low, high, base, offset, n_regs)
3184      FILE *file;
3185      int low, high;
3186      char *base;
3187      int offset;
3188      int n_regs;
3189 {
3190   int i;
3191
3192   if (TARGET_ARCH64 && high <= 32)
3193     {
3194       for (i = low; i < high; i++)
3195         {
3196           if (regs_ever_live[i] && ! call_used_regs[i])
3197             fprintf (file, "\tldx [%s+%d], %s\n",
3198               base, offset + 4 * n_regs, reg_names[i]),
3199             n_regs += 2;
3200         }
3201     }
3202   else
3203     {
3204       for (i = low; i < high; i += 2)
3205         {
3206           if (regs_ever_live[i] && ! call_used_regs[i])
3207             if (regs_ever_live[i+1] && ! call_used_regs[i+1])
3208               fprintf (file, "\tldd [%s+%d], %s\n",
3209                        base, offset + 4 * n_regs, reg_names[i]),
3210               n_regs += 2;
3211             else
3212               fprintf (file, "\tld [%s+%d],%s\n",
3213                        base, offset + 4 * n_regs, reg_names[i]),
3214               n_regs += 2;
3215           else if (regs_ever_live[i+1] && ! call_used_regs[i+1])
3216             fprintf (file, "\tld [%s+%d],%s\n",
3217                      base, offset + 4 * n_regs + 4, reg_names[i+1]),
3218             n_regs += 2;
3219         }
3220     }
3221   return n_regs;
3222 }
3223
3224 /* Static variables we want to share between prologue and epilogue.  */
3225
3226 /* Number of live general or floating point registers needed to be saved
3227    (as 4-byte quantities).  This is only done if TARGET_EPILOGUE.  */
3228 static int num_gfregs;
3229
3230 /* Compute the frame size required by the function.  This function is called
3231    during the reload pass and also by output_function_prologue().  */
3232
3233 int
3234 compute_frame_size (size, leaf_function)
3235      int size;
3236      int leaf_function;
3237 {
3238   int n_regs = 0, i;
3239   int outgoing_args_size = (current_function_outgoing_args_size
3240                             + REG_PARM_STACK_SPACE (current_function_decl));
3241
3242   if (TARGET_EPILOGUE)
3243     {
3244       /* N_REGS is the number of 4-byte regs saved thus far.  This applies
3245          even to v9 int regs to be consistent with save_regs/restore_regs.  */
3246
3247       if (TARGET_ARCH64)
3248         {
3249           for (i = 0; i < 8; i++)
3250             if (regs_ever_live[i] && ! call_used_regs[i])
3251               n_regs += 2;
3252         }
3253       else
3254         {
3255           for (i = 0; i < 8; i += 2)
3256             if ((regs_ever_live[i] && ! call_used_regs[i])
3257                 || (regs_ever_live[i+1] && ! call_used_regs[i+1]))
3258               n_regs += 2;
3259         }
3260
3261       for (i = 32; i < (TARGET_V9 ? 96 : 64); i += 2)
3262         if ((regs_ever_live[i] && ! call_used_regs[i])
3263             || (regs_ever_live[i+1] && ! call_used_regs[i+1]))
3264           n_regs += 2;
3265     }
3266
3267   /* Set up values for use in `function_epilogue'.  */
3268   num_gfregs = n_regs;
3269
3270   if (leaf_function && n_regs == 0
3271       && size == 0 && current_function_outgoing_args_size == 0)
3272     {
3273       actual_fsize = apparent_fsize = 0;
3274     }
3275   else
3276     {
3277       /* We subtract STARTING_FRAME_OFFSET, remember it's negative.
3278          The stack bias (if any) is taken out to undo its effects.  */
3279       apparent_fsize = (size - STARTING_FRAME_OFFSET + SPARC_STACK_BIAS + 7) & -8;
3280       apparent_fsize += n_regs * 4;
3281       actual_fsize = apparent_fsize + ((outgoing_args_size + 7) & -8);
3282     }
3283
3284   /* Make sure nothing can clobber our register windows.
3285      If a SAVE must be done, or there is a stack-local variable,
3286      the register window area must be allocated.
3287      ??? For v8 we apparently need an additional 8 bytes of reserved space.  */
3288   if (leaf_function == 0 || size > 0)
3289     actual_fsize += (16 * UNITS_PER_WORD) + (TARGET_ARCH64 ? 0 : 8);
3290
3291   return SPARC_STACK_ALIGN (actual_fsize);
3292 }
3293
3294 /* Build a (32 bit) big number in a register.  */
3295 /* ??? We may be able to use the set macro here too.  */
3296
3297 static void
3298 build_big_number (file, num, reg)
3299      FILE *file;
3300      int num;
3301      char *reg;
3302 {
3303   if (num >= 0 || ! TARGET_ARCH64)
3304     {
3305       fprintf (file, "\tsethi %%hi(%d),%s\n", num, reg);
3306       if ((num & 0x3ff) != 0)
3307         fprintf (file, "\tor %s,%%lo(%d),%s\n", reg, num, reg);
3308     }
3309   else /* num < 0 && TARGET_ARCH64 */
3310     {
3311       /* Sethi does not sign extend, so we must use a little trickery
3312          to use it for negative numbers.  Invert the constant before
3313          loading it in, then use xor immediate to invert the loaded bits
3314          (along with the upper 32 bits) to the desired constant.  This
3315          works because the sethi and immediate fields overlap.  */
3316       int asize = num;
3317       int inv = ~asize;
3318       int low = -0x400 + (asize & 0x3FF);
3319
3320       fprintf (file, "\tsethi %%hi(%d),%s\n\txor %s,%d,%s\n",
3321                inv, reg, reg, low, reg);
3322     }
3323 }
3324
3325 /* Output code for the function prologue.  */
3326
3327 void
3328 output_function_prologue (file, size, leaf_function)
3329      FILE *file;
3330      int size;
3331      int leaf_function;
3332 {
3333   /* Need to use actual_fsize, since we are also allocating
3334      space for our callee (and our own register save area).  */
3335   actual_fsize = compute_frame_size (size, leaf_function);
3336
3337   if (leaf_function)
3338     {
3339       frame_base_name = "%sp";
3340       frame_base_offset = actual_fsize + SPARC_STACK_BIAS;
3341     }
3342   else
3343     {
3344       frame_base_name = "%fp";
3345       frame_base_offset = SPARC_STACK_BIAS;
3346     }
3347
3348   /* This is only for the human reader.  */
3349   fprintf (file, "\t%s#PROLOGUE# 0\n", ASM_COMMENT_START);
3350
3351   if (actual_fsize == 0)
3352     /* do nothing.  */ ;
3353   else if (! leaf_function && ! TARGET_BROKEN_SAVERESTORE)
3354     {
3355       if (actual_fsize <= 4096)
3356         fprintf (file, "\tsave %%sp,-%d,%%sp\n", actual_fsize);
3357       else if (actual_fsize <= 8192)
3358         {
3359           fprintf (file, "\tsave %%sp,-4096,%%sp\n");
3360           fprintf (file, "\tadd %%sp,-%d,%%sp\n", actual_fsize - 4096);
3361         }
3362       else
3363         {
3364           build_big_number (file, -actual_fsize, "%g1");
3365           fprintf (file, "\tsave %%sp,%%g1,%%sp\n");
3366         }
3367     }
3368   else if (! leaf_function && TARGET_BROKEN_SAVERESTORE)
3369     {
3370       /* We assume the environment will properly handle or otherwise avoid
3371          trouble associated with an interrupt occurring after the `save' or
3372          trap occurring during it.  */
3373       fprintf (file, "\tsave\n");
3374
3375       if (actual_fsize <= 4096)
3376         fprintf (file, "\tadd %%fp,-%d,%%sp\n", actual_fsize);
3377       else if (actual_fsize <= 8192)
3378         {
3379           fprintf (file, "\tadd %%fp,-4096,%%sp\n");
3380           fprintf (file, "\tadd %%fp,-%d,%%sp\n", actual_fsize - 4096);
3381         }
3382       else
3383         {
3384           build_big_number (file, -actual_fsize, "%g1");
3385           fprintf (file, "\tadd %%fp,%%g1,%%sp\n");
3386         }
3387     }
3388   else /* leaf function */
3389     {
3390       if (actual_fsize <= 4096)
3391         fprintf (file, "\tadd %%sp,-%d,%%sp\n", actual_fsize);
3392       else if (actual_fsize <= 8192)
3393         {
3394           fprintf (file, "\tadd %%sp,-4096,%%sp\n");
3395           fprintf (file, "\tadd %%sp,-%d,%%sp\n", actual_fsize - 4096);
3396         }
3397       else
3398         {
3399           build_big_number (file, -actual_fsize, "%g1");
3400           fprintf (file, "\tadd %%sp,%%g1,%%sp\n");
3401         }
3402     }
3403
3404   if (dwarf2out_do_frame () && actual_fsize)
3405     {
3406       char *label = dwarf2out_cfi_label ();
3407
3408       /* The canonical frame address refers to the top of the frame.  */
3409       dwarf2out_def_cfa (label, (leaf_function ? STACK_POINTER_REGNUM
3410                                  : FRAME_POINTER_REGNUM),
3411                          frame_base_offset);
3412
3413       if (! leaf_function)
3414         {
3415           /* Note the register window save.  This tells the unwinder that
3416              it needs to restore the window registers from the previous
3417              frame's window save area at 0(cfa).  */
3418           dwarf2out_window_save (label);
3419
3420           /* The return address (-8) is now in %i7.  */
3421           dwarf2out_return_reg (label, 31);
3422         }
3423     }
3424
3425   /* If doing anything with PIC, do it now.  */
3426   if (! flag_pic)
3427     fprintf (file, "\t%s#PROLOGUE# 1\n", ASM_COMMENT_START);
3428
3429   /* Call saved registers are saved just above the outgoing argument area.  */
3430   if (num_gfregs)
3431     {
3432       int offset, real_offset, n_regs;
3433       char *base;
3434
3435       real_offset = -apparent_fsize;
3436       offset = -apparent_fsize + frame_base_offset;
3437       if (offset < -4096 || offset + num_gfregs * 4 > 4096)
3438         {
3439           /* ??? This might be optimized a little as %g1 might already have a
3440              value close enough that a single add insn will do.  */
3441           /* ??? Although, all of this is probably only a temporary fix
3442              because if %g1 can hold a function result, then
3443              output_function_epilogue will lose (the result will get
3444              clobbered).  */
3445           build_big_number (file, offset, "%g1");
3446           fprintf (file, "\tadd %s,%%g1,%%g1\n", frame_base_name);
3447           base = "%g1";
3448           offset = 0;
3449         }
3450       else
3451         {
3452           base = frame_base_name;
3453         }
3454
3455       if (TARGET_EPILOGUE && ! leaf_function)
3456         /* ??? Originally saved regs 0-15 here.  */
3457         n_regs = save_regs (file, 0, 8, base, offset, 0, real_offset);
3458       else if (leaf_function)
3459         /* ??? Originally saved regs 0-31 here.  */
3460         n_regs = save_regs (file, 0, 8, base, offset, 0, real_offset);
3461       if (TARGET_EPILOGUE)
3462         save_regs (file, 32, TARGET_V9 ? 96 : 64, base, offset, n_regs,
3463                    real_offset);
3464     }
3465
3466   leaf_label = 0;
3467   if (leaf_function && actual_fsize != 0)
3468     {
3469       /* warning ("leaf procedure with frame size %d", actual_fsize); */
3470       if (! TARGET_EPILOGUE)
3471         leaf_label = gen_label_rtx ();
3472     }
3473 }
3474
3475 /* Output code for the function epilogue.  */
3476
3477 void
3478 output_function_epilogue (file, size, leaf_function)
3479      FILE *file;
3480      int size;
3481      int leaf_function;
3482 {
3483   char *ret;
3484
3485   if (leaf_label)
3486     {
3487       emit_label_after (leaf_label, get_last_insn ());
3488       final_scan_insn (get_last_insn (), file, 0, 0, 1);
3489     }
3490
3491 #ifdef FUNCTION_BLOCK_PROFILER_EXIT
3492   else if (profile_block_flag == 2)
3493     {
3494       FUNCTION_BLOCK_PROFILER_EXIT(file);
3495     }
3496 #endif
3497
3498   /* Restore any call saved registers.  */
3499   if (num_gfregs)
3500     {
3501       int offset, n_regs;
3502       char *base;
3503
3504       offset = -apparent_fsize + frame_base_offset;
3505       if (offset < -4096 || offset + num_gfregs * 4 > 4096 - 8 /*double*/)
3506         {
3507           build_big_number (file, offset, "%g1");
3508           fprintf (file, "\tadd %s,%%g1,%%g1\n", frame_base_name);
3509           base = "%g1";
3510           offset = 0;
3511         }
3512       else
3513         {
3514           base = frame_base_name;
3515         }
3516
3517       if (TARGET_EPILOGUE && ! leaf_function)
3518         /* ??? Originally saved regs 0-15 here.  */
3519         n_regs = restore_regs (file, 0, 8, base, offset, 0);
3520       else if (leaf_function)
3521         /* ??? Originally saved regs 0-31 here.  */
3522         n_regs = restore_regs (file, 0, 8, base, offset, 0);
3523       if (TARGET_EPILOGUE)
3524         restore_regs (file, 32, TARGET_V9 ? 96 : 64, base, offset, n_regs);
3525     }
3526
3527   /* Work out how to skip the caller's unimp instruction if required.  */
3528   if (leaf_function)
3529     ret = (SKIP_CALLERS_UNIMP_P ? "jmp %o7+12" : "retl");
3530   else
3531     ret = (SKIP_CALLERS_UNIMP_P ? "jmp %i7+12" : "ret");
3532
3533   if (TARGET_EPILOGUE || leaf_label)
3534     {
3535       int old_target_epilogue = TARGET_EPILOGUE;
3536       target_flags &= ~old_target_epilogue;
3537
3538       if (! leaf_function)
3539         {
3540           /* If we wound up with things in our delay slot, flush them here.  */
3541           if (current_function_epilogue_delay_list)
3542             {
3543               rtx insn = emit_jump_insn_after (gen_rtx (RETURN, VOIDmode),
3544                                                get_last_insn ());
3545               PATTERN (insn) = gen_rtx (PARALLEL, VOIDmode,
3546                                         gen_rtvec (2,
3547                                                    PATTERN (XEXP (current_function_epilogue_delay_list, 0)),
3548                                                    PATTERN (insn)));
3549               final_scan_insn (insn, file, 1, 0, 1);
3550             }
3551           else
3552             fprintf (file, "\t%s\n\trestore\n", ret);
3553         }
3554       /* All of the following cases are for leaf functions.  */
3555       else if (current_function_epilogue_delay_list)
3556         {
3557           /* eligible_for_epilogue_delay_slot ensures that if this is a
3558              leaf function, then we will only have insn in the delay slot
3559              if the frame size is zero, thus no adjust for the stack is
3560              needed here.  */
3561           if (actual_fsize != 0)
3562             abort ();
3563           fprintf (file, "\t%s\n", ret);
3564           final_scan_insn (XEXP (current_function_epilogue_delay_list, 0),
3565                            file, 1, 0, 1);
3566         }
3567       /* Output 'nop' instead of 'sub %sp,-0,%sp' when no frame, so as to
3568          avoid generating confusing assembly language output.  */
3569       else if (actual_fsize == 0)
3570         fprintf (file, "\t%s\n\tnop\n", ret);
3571       else if (actual_fsize <= 4096)
3572         fprintf (file, "\t%s\n\tsub %%sp,-%d,%%sp\n", ret, actual_fsize);
3573       else if (actual_fsize <= 8192)
3574         fprintf (file, "\tsub %%sp,-4096,%%sp\n\t%s\n\tsub %%sp,-%d,%%sp\n",
3575                  ret, actual_fsize - 4096);
3576       else if ((actual_fsize & 0x3ff) == 0)
3577         fprintf (file, "\tsethi %%hi(%d),%%g1\n\t%s\n\tadd %%sp,%%g1,%%sp\n",
3578                  actual_fsize, ret);
3579       else
3580         fprintf (file, "\tsethi %%hi(%d),%%g1\n\tor %%g1,%%lo(%d),%%g1\n\t%s\n\tadd %%sp,%%g1,%%sp\n",
3581                  actual_fsize, actual_fsize, ret);
3582       target_flags |= old_target_epilogue;
3583     }
3584 }
3585 \f
3586 /* Functions for handling argument passing.
3587
3588    For v8 the first six args are normally in registers and the rest are
3589    pushed.  Any arg that starts within the first 6 words is at least
3590    partially passed in a register unless its data type forbids.
3591
3592    For v9, the argument registers are laid out as an array of 16 elements
3593    and arguments are added sequentially.  The first 6 int args and up to the
3594    first 16 fp args (depending on size) are passed in regs.
3595
3596    Slot    Stack   Integral   Float   Float in structure   Double   Long Double
3597    ----    -----   --------   -----   ------------------   ------   -----------
3598     15   [SP+248]              %f31       %f30,%f31         %d30
3599     14   [SP+240]              %f29       %f28,%f29         %d28       %q28
3600     13   [SP+232]              %f27       %f26,%f27         %d26
3601     12   [SP+224]              %f25       %f24,%f25         %d24       %q24
3602     11   [SP+216]              %f23       %f22,%f23         %d22
3603     10   [SP+208]              %f21       %f20,%f21         %d20       %q20
3604      9   [SP+200]              %f19       %f18,%f19         %d18
3605      8   [SP+192]              %f17       %f16,%f17         %d16       %q16
3606      7   [SP+184]              %f15       %f14,%f15         %d14
3607      6   [SP+176]              %f13       %f12,%f13         %d12       %q12
3608      5   [SP+168]     %o5      %f11       %f10,%f11         %d10
3609      4   [SP+160]     %o4       %f9        %f8,%f9           %d8        %q8
3610      3   [SP+152]     %o3       %f7        %f6,%f7           %d6
3611      2   [SP+144]     %o2       %f5        %f4,%f5           %d4        %q4
3612      1   [SP+136]     %o1       %f3        %f2,%f3           %d2
3613      0   [SP+128]     %o0       %f1        %f0,%f1           %d0        %q0
3614
3615    Here SP = %sp if -mno-stack-bias or %sp+stack_bias otherwise.
3616
3617    Integral arguments are always passed as 64 bit quantities appropriately
3618    extended.
3619
3620    Passing of floating point values is handled as follows.
3621    If a prototype is in scope:
3622      If the value is in a named argument (i.e. not a stdarg function or a
3623      value not part of the `...') then the value is passed in the appropriate
3624      fp reg.
3625      If the value is part of the `...' and is passed in one of the first 6
3626      slots then the value is passed in the appropriate int reg.
3627      If the value is part of the `...' and is not passed in one of the first 6
3628      slots then the value is passed in memory.
3629    If a prototype is not in scope:
3630      If the value is one of the first 6 arguments the value is passed in the
3631      appropriate integer reg and the appropriate fp reg.
3632      If the value is not one of the first 6 arguments the value is passed in
3633      the appropriate fp reg and in memory.
3634    */
3635
3636 /* Maximum number of int regs for args.  */
3637 #define SPARC_INT_ARG_MAX 6
3638 /* Maximum number of fp regs for args.  */
3639 #define SPARC_FP_ARG_MAX 16
3640
3641 #define ROUND_ADVANCE(SIZE) (((SIZE) + UNITS_PER_WORD - 1) / UNITS_PER_WORD)
3642
3643 /* Handle the INIT_CUMULATIVE_ARGS macro.
3644    Initialize a variable CUM of type CUMULATIVE_ARGS
3645    for a call to a function whose data type is FNTYPE.
3646    For a library call, FNTYPE is 0.  */
3647
3648 void
3649 init_cumulative_args (cum, fntype, libname, indirect)
3650      CUMULATIVE_ARGS *cum;
3651      tree fntype, libname;
3652      int indirect;
3653 {
3654   cum->words = 0;
3655   cum->prototype_p = fntype && TYPE_ARG_TYPES (fntype);
3656   cum->libcall_p = fntype == 0;
3657 }
3658
3659 /* Compute the slot number to pass an argument in.
3660    Returns the slot number or -1 if passing on the stack.
3661
3662    CUM is a variable of type CUMULATIVE_ARGS which gives info about
3663     the preceding args and about the function being called.
3664    MODE is the argument's machine mode.
3665    TYPE is the data type of the argument (as a tree).
3666     This is null for libcalls where that information may
3667     not be available.
3668    NAMED is nonzero if this argument is a named parameter
3669     (otherwise it is an extra parameter matching an ellipsis).
3670    INCOMING_P is zero for FUNCTION_ARG, nonzero for FUNCTION_INCOMING_ARG.
3671    *PREGNO records the register number to use if scalar type.
3672    *PPADDING records the amount of padding needed in words.  */
3673
3674 static int
3675 function_arg_slotno (cum, mode, type, named, incoming_p, pregno, ppadding)
3676      const CUMULATIVE_ARGS *cum;
3677      enum machine_mode mode;
3678      tree type;
3679      int named;
3680      int incoming_p;
3681      int *pregno;
3682      int *ppadding;
3683 {
3684   int regbase = (incoming_p
3685                  ? SPARC_INCOMING_INT_ARG_FIRST
3686                  : SPARC_OUTGOING_INT_ARG_FIRST);
3687   int slotno = cum->words;
3688   int regno;
3689
3690   *ppadding = 0;
3691
3692   if (type != 0 && TREE_ADDRESSABLE (type))
3693     return -1;
3694   if (TARGET_ARCH32
3695       && type != 0 && mode == BLKmode
3696       && TYPE_ALIGN (type) % PARM_BOUNDARY != 0)
3697     return -1;
3698
3699   switch (mode)
3700     {
3701     case VOIDmode :
3702       /* MODE is VOIDmode when generating the actual call.
3703          See emit_call_1.  */
3704       return -1;
3705
3706     case QImode : case CQImode :
3707     case HImode : case CHImode :
3708     case SImode : case CSImode :
3709     case DImode : case CDImode :
3710       if (slotno >= SPARC_INT_ARG_MAX)
3711         return -1;
3712       regno = regbase + slotno;
3713       break;
3714
3715     case SFmode : case SCmode :
3716     case DFmode : case DCmode :
3717     case TFmode : case TCmode :
3718       if (TARGET_ARCH32)
3719         {
3720           if (slotno >= SPARC_INT_ARG_MAX)
3721             return -1;
3722           regno = regbase + slotno;
3723         }
3724       else
3725         {
3726           if ((mode == TFmode || mode == TCmode)
3727               && (slotno & 1) != 0)
3728             slotno++, *ppadding = 1;
3729           if (TARGET_FPU && named)
3730             {
3731               if (slotno >= SPARC_FP_ARG_MAX)
3732                 return 0;
3733               regno = SPARC_FP_ARG_FIRST + slotno * 2;
3734               if (mode == SFmode)
3735                 regno++;
3736             }
3737           else
3738             {
3739               if (slotno >= SPARC_INT_ARG_MAX)
3740                 return -1;
3741               regno = regbase + slotno;
3742             }
3743         }
3744       break;
3745
3746     case BLKmode :
3747       /* For sparc64, objects requiring 16 byte alignment get it.  */
3748       if (TARGET_ARCH64)
3749         {
3750           if (type && TYPE_ALIGN (type) == 128 && (slotno & 1) != 0)
3751             slotno++, *ppadding = 1;
3752         }
3753
3754       if (TARGET_ARCH32
3755           || type && TREE_CODE (type) == UNION_TYPE)
3756         {
3757           if (slotno >= SPARC_INT_ARG_MAX)
3758             return -1;
3759           regno = regbase + slotno;
3760         }
3761       else
3762         {
3763           tree field;
3764           int intregs_p = 0, fpregs_p = 0;
3765           /* The ABI obviously doesn't specify how packed
3766              structures are passed.  These are defined to be passed
3767              in int regs if possible, otherwise memory.  */
3768           int packed_p = 0;
3769
3770           /* First see what kinds of registers we need.  */
3771           for (field = TYPE_FIELDS (type); field; field = TREE_CHAIN (field))
3772             {
3773               if (TREE_CODE (field) == FIELD_DECL)
3774                 {
3775                   if (TREE_CODE (TREE_TYPE (field)) == REAL_TYPE
3776                       && TARGET_FPU)
3777                     fpregs_p = 1;
3778                   else
3779                     intregs_p = 1;
3780                   if (DECL_PACKED (field))
3781                     packed_p = 1;
3782                 }
3783             }
3784           if (packed_p || !named)
3785             fpregs_p = 0, intregs_p = 1;
3786
3787           /* If all arg slots are filled, then must pass on stack.  */
3788           if (fpregs_p && slotno >= SPARC_FP_ARG_MAX)
3789             return -1;
3790           /* If there are only int args and all int arg slots are filled,
3791              then must pass on stack.  */
3792           if (!fpregs_p && intregs_p && slotno >= SPARC_INT_ARG_MAX)
3793             return -1;
3794           /* Note that even if all int arg slots are filled, fp members may
3795              still be passed in regs if such regs are available.
3796              *PREGNO isn't set because there may be more than one, it's up
3797              to the caller to compute them.  */
3798           return slotno;
3799         }
3800       break;
3801
3802     default :
3803       abort ();
3804     }
3805
3806   *pregno = regno;
3807   return slotno;
3808 }
3809
3810 /* Handle the FUNCTION_ARG macro.
3811    Determine where to put an argument to a function.
3812    Value is zero to push the argument on the stack,
3813    or a hard register in which to store the argument.
3814
3815    CUM is a variable of type CUMULATIVE_ARGS which gives info about
3816     the preceding args and about the function being called.
3817    MODE is the argument's machine mode.
3818    TYPE is the data type of the argument (as a tree).
3819     This is null for libcalls where that information may
3820     not be available.
3821    NAMED is nonzero if this argument is a named parameter
3822     (otherwise it is an extra parameter matching an ellipsis).
3823    INCOMING_P is zero for FUNCTION_ARG, nonzero for FUNCTION_INCOMING_ARG.  */
3824
3825 rtx
3826 function_arg (cum, mode, type, named, incoming_p)
3827      const CUMULATIVE_ARGS *cum;
3828      enum machine_mode mode;
3829      tree type;
3830      int named;
3831      int incoming_p;
3832 {
3833   int regbase = (incoming_p
3834                  ? SPARC_INCOMING_INT_ARG_FIRST
3835                  : SPARC_OUTGOING_INT_ARG_FIRST);
3836   int slotno, regno, padding;
3837   rtx reg;
3838
3839   slotno = function_arg_slotno (cum, mode, type, named, incoming_p,
3840                                 &regno, &padding);
3841
3842   if (slotno == -1)
3843     return 0;
3844
3845   if (TARGET_ARCH32)
3846     {
3847       reg = gen_rtx (REG, mode, regno);
3848       return reg;
3849     }
3850
3851   /* v9 fp args in reg slots beyond the int reg slots get passed in regs
3852      but also have the slot allocated for them.
3853      If no prototype is in scope fp values in register slots get passed
3854      in two places, either fp regs and int regs or fp regs and memory.  */
3855   if ((GET_MODE_CLASS (mode) == MODE_FLOAT
3856        || GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT)
3857       && SPARC_FP_REG_P (regno))
3858     {
3859       reg = gen_rtx (REG, mode, regno);
3860       if (cum->prototype_p || cum->libcall_p)
3861         {
3862           /* "* 2" because fp reg numbers are recorded in 4 byte
3863              quantities.  */
3864           /* ??? This will cause the value to be passed in the fp reg and
3865              in the stack.  When a prototype exists we want to pass the
3866              value in the reg but reserve space on the stack.  That's an
3867              optimization, and is deferred [for a bit].  */
3868           if ((regno - SPARC_FP_ARG_FIRST) >= SPARC_INT_ARG_MAX * 2)
3869             return gen_rtx (PARALLEL, mode,
3870                             gen_rtvec (2,
3871                                        gen_rtx (EXPR_LIST, VOIDmode,
3872                                                 NULL_RTX, const0_rtx),
3873                                        gen_rtx (EXPR_LIST, VOIDmode,
3874                                                 reg, const0_rtx)));
3875           else
3876             return reg;
3877         }
3878       else
3879         {
3880           if ((regno - SPARC_FP_ARG_FIRST) < SPARC_INT_ARG_MAX * 2)
3881             {
3882               int regbase = (incoming_p
3883                              ? SPARC_INCOMING_INT_ARG_FIRST
3884                              : SPARC_OUTGOING_INT_ARG_FIRST);
3885               int intreg = regbase + (regno - SPARC_FP_ARG_FIRST) / 2;
3886               return gen_rtx (PARALLEL, mode,
3887                               gen_rtvec (2,
3888                                          gen_rtx (EXPR_LIST, VOIDmode,
3889                                                   gen_rtx (REG, mode, intreg),
3890                                                   const0_rtx),
3891                                          gen_rtx (EXPR_LIST, VOIDmode,
3892                                                   reg, const0_rtx)));
3893             }
3894           else
3895             return gen_rtx (PARALLEL, mode,
3896                             gen_rtvec (2,
3897                                        gen_rtx (EXPR_LIST, VOIDmode,
3898                                                 NULL_RTX, const0_rtx),
3899                                        gen_rtx (EXPR_LIST, VOIDmode,
3900                                                 reg, const0_rtx)));
3901         }
3902     }
3903   else if (type && TREE_CODE (type) == RECORD_TYPE)
3904     {
3905       /* Structures up to 16 bytes in size are passed in arg slots on the
3906          stack and are promoted to registers where possible.  */
3907       tree field;
3908       rtx ret;
3909       int i;
3910       int nregs;
3911       /* Starting bit position of a sequence of integer fields, counted from
3912          msb of left most byte, -1 if last field wasn't an int.  */
3913       /* ??? This isn't entirely necessary, some simplification
3914          may be possible.  */
3915       int start_int_bitpos;
3916       /* Current bitpos in struct, counted from msb of left most byte.  */
3917       int bitpos, this_slotno;
3918       /* The ABI obviously doesn't specify how packed
3919          structures are passed.  These are defined to be passed
3920          in int regs if possible, otherwise memory.  */
3921       int packed_p = 0;
3922
3923       if (int_size_in_bytes (type) > 16)
3924         abort (); /* shouldn't get here */
3925
3926       /* We need to compute how many registers are needed so we can allocate
3927          the PARALLEL but before we can do that we need to know whether there
3928          are any packed fields.  If there are, int regs are used regardless of
3929          whether there are fp values present.  */
3930       for (field = TYPE_FIELDS (type); field; field = TREE_CHAIN (field))
3931         {
3932           if (TREE_CODE (field) == FIELD_DECL
3933               && DECL_PACKED (field))
3934             {
3935               packed_p = 1;
3936               break;
3937             }
3938         }
3939
3940       /* Compute how many registers we need.  */
3941       nregs = 0;
3942       start_int_bitpos = -1;
3943       for (field = TYPE_FIELDS (type); field; field = TREE_CHAIN (field))
3944         {
3945           bitpos = TREE_INT_CST_LOW (DECL_FIELD_BITPOS (field));
3946           this_slotno = slotno + bitpos / BITS_PER_WORD;
3947           if (TREE_CODE (field) == FIELD_DECL)
3948             {
3949               if (TREE_CODE (TREE_TYPE (field)) == REAL_TYPE
3950                   && TARGET_FPU
3951                   && ! packed_p
3952                   && named)
3953                 {
3954                   /* There's no need to check this_slotno < SPARC_FP_ARG MAX.
3955                      If it wasn't true we wouldn't be here.  */
3956                   nregs++;
3957                   start_int_bitpos = -1;
3958                 }
3959               else if (this_slotno < SPARC_INT_ARG_MAX)
3960                 {
3961                   if (start_int_bitpos == -1)
3962                     {
3963                       nregs++;
3964                       start_int_bitpos = bitpos;
3965                     }
3966                   else
3967                     {
3968                       if (bitpos % BITS_PER_WORD == 0)
3969                         nregs++;
3970                     }
3971                 }
3972             }
3973         }
3974       if (nregs == 0)
3975         abort ();
3976
3977       ret = gen_rtx (PARALLEL, BLKmode, rtvec_alloc (nregs + 1));
3978
3979       /* ??? This causes the entire struct to be passed in memory.
3980          This isn't necessary, but is left for later.  */
3981       XVECEXP (ret, 0, 0) = gen_rtx (EXPR_LIST, VOIDmode, NULL_RTX,
3982                                      const0_rtx);
3983
3984       /* Fill in the entries.  */
3985       start_int_bitpos = -1;
3986       for (i = 1, field = TYPE_FIELDS (type);
3987            field;
3988            field = TREE_CHAIN (field))
3989         {
3990           bitpos = TREE_INT_CST_LOW (DECL_FIELD_BITPOS (field));
3991           this_slotno = slotno + bitpos / BITS_PER_WORD;
3992           if (TREE_CODE (field) == FIELD_DECL)
3993             {
3994               if (TREE_CODE (TREE_TYPE (field)) == REAL_TYPE
3995                   && TARGET_FPU
3996                   && ! packed_p
3997                   && named)
3998                 {
3999                   reg = gen_rtx (REG, DECL_MODE (field),
4000                                  (SPARC_FP_ARG_FIRST + this_slotno * 2
4001                                   + (DECL_MODE (field) == SFmode
4002                                      && (bitpos & 32) != 0)));
4003                   XVECEXP (ret, 0, i) = gen_rtx (EXPR_LIST, VOIDmode, reg,
4004                                                  GEN_INT (bitpos / BITS_PER_UNIT));
4005                   i++;
4006                   start_int_bitpos = -1;
4007                 }
4008               else
4009                 {
4010                   if (this_slotno < SPARC_INT_ARG_MAX
4011                       && (start_int_bitpos == -1
4012                           || bitpos % BITS_PER_WORD == 0))
4013                     {
4014                       enum machine_mode mode;
4015
4016                       /* If this is the trailing part of a word, only load
4017                          that much into the register.  Otherwise load the
4018                          whole register.  Note that in the latter case we may
4019                          pick up unwanted bits.  It's not a problem at the
4020                          moment but may wish to revisit.  */
4021                       if (bitpos % BITS_PER_WORD != 0)
4022                         mode = mode_for_size (BITS_PER_WORD - bitpos % BITS_PER_WORD,
4023                                               MODE_INT, 0);
4024                       else
4025                         mode = word_mode;
4026
4027                       regno = regbase + this_slotno;
4028                       reg = gen_rtx (REG, mode, regno);
4029                       XVECEXP (ret, 0, i) = gen_rtx (EXPR_LIST, VOIDmode, reg,
4030                                                      GEN_INT (bitpos / BITS_PER_UNIT));
4031                       i++;
4032                       if (start_int_bitpos == -1)
4033                         start_int_bitpos = bitpos;
4034                     }
4035                 }
4036             }
4037         }
4038       if (i != nregs + 1)
4039         abort ();
4040
4041       return ret;
4042     }
4043   else if (type && TREE_CODE (type) == UNION_TYPE)
4044     {
4045       enum machine_mode mode;
4046       int bytes = int_size_in_bytes (type);
4047
4048       if (bytes > 16)
4049         abort ();
4050
4051       mode = mode_for_size (bytes * BITS_PER_UNIT, MODE_INT, 0);
4052       reg = gen_rtx (REG, mode, regno);
4053     }
4054   else
4055     {
4056       /* Scalar or complex int.  */
4057       reg = gen_rtx (REG, mode, regno);
4058     }
4059
4060   return reg;
4061 }
4062
4063 /* Handle the FUNCTION_ARG_PARTIAL_NREGS macro.
4064    For an arg passed partly in registers and partly in memory,
4065    this is the number of registers used.
4066    For args passed entirely in registers or entirely in memory, zero.
4067
4068    Any arg that starts in the first 6 regs but won't entirely fit in them
4069    needs partial registers on v8.  On v9, structures with integer
4070    values in arg slots 5,6 will be passed in %o5 and SP+176, and complex fp
4071    values that begin in the last fp reg [where "last fp reg" varies with the
4072    mode] will be split between that reg and memory.  */
4073
4074 int
4075 function_arg_partial_nregs (cum, mode, type, named)
4076      const CUMULATIVE_ARGS *cum;
4077      enum machine_mode mode;
4078      tree type;
4079      int named;
4080 {
4081   int slotno, regno, padding;
4082
4083   /* We pass 0 for incoming_p here, it doesn't matter.  */
4084   slotno = function_arg_slotno (cum, mode, type, named, 0, &regno, &padding);
4085
4086   if (slotno == -1)
4087     return 0;
4088
4089   if (TARGET_ARCH32)
4090     {
4091       if ((slotno + (mode == BLKmode
4092                      ? ROUND_ADVANCE (int_size_in_bytes (type))
4093                      : ROUND_ADVANCE (GET_MODE_SIZE (mode))))
4094           > NPARM_REGS (SImode))
4095         return NPARM_REGS (SImode) - slotno;
4096       return 0;
4097     }
4098   else
4099     {
4100       if (type && AGGREGATE_TYPE_P (type))
4101         {
4102           int size = int_size_in_bytes (type);
4103           int align = TYPE_ALIGN (type);
4104
4105           if (align == 16)
4106             slotno += slotno & 1;
4107           if (size > 8 && size <= 16
4108               && slotno == SPARC_INT_ARG_MAX - 1)
4109             return 1;
4110         }
4111       else if (GET_MODE_CLASS (mode) == MODE_COMPLEX_INT
4112                || (GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT
4113                    && ! TARGET_FPU))
4114         {
4115           if (GET_MODE_ALIGNMENT (mode) == 128)
4116             {
4117               slotno += slotno & 1;
4118               if (slotno == SPARC_INT_ARG_MAX - 2)
4119                 return 1;
4120             }
4121           else
4122             {
4123               if (slotno == SPARC_INT_ARG_MAX - 1)
4124                 return 1;
4125             }
4126         }
4127       else if (GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT)
4128         {
4129           if (GET_MODE_ALIGNMENT (mode) == 128)
4130             slotno += slotno & 1;
4131           if ((slotno + GET_MODE_SIZE (mode) / UNITS_PER_WORD)
4132               > SPARC_FP_ARG_MAX)
4133             return 1;
4134         }
4135       return 0;
4136     }
4137 }
4138
4139 /* Handle the FUNCTION_ARG_PASS_BY_REFERENCE macro.
4140    !v9: The SPARC ABI stipulates passing struct arguments (of any size) and
4141    quad-precision floats by invisible reference.
4142    v9: aggregates greater than 16 bytes are passed by reference.
4143    For Pascal, also pass arrays by reference.  */
4144
4145 int
4146 function_arg_pass_by_reference (cum, mode, type, named)
4147      const CUMULATIVE_ARGS *cum;
4148      enum machine_mode mode;
4149      tree type;
4150      int named;
4151 {
4152   if (TARGET_ARCH32)
4153     {
4154       return (type && AGGREGATE_TYPE_P (type)
4155               || mode == TFmode || mode == TCmode);
4156     }
4157   else
4158     {
4159       return ((type && TREE_CODE (type) == ARRAY_TYPE)
4160               || (type && AGGREGATE_TYPE_P (type)
4161                   && int_size_in_bytes (type) > 16));
4162     }
4163 }
4164
4165 /* Handle the FUNCTION_ARG_ADVANCE macro.
4166    Update the data in CUM to advance over an argument
4167    of mode MODE and data type TYPE.
4168    TYPE is null for libcalls where that information may not be available.  */
4169
4170 void
4171 function_arg_advance (cum, mode, type, named)
4172      CUMULATIVE_ARGS *cum;
4173      enum machine_mode mode;
4174      tree type;
4175      int named;
4176 {
4177   int slotno, regno, padding;
4178
4179   /* We pass 0 for incoming_p here, it doesn't matter.  */
4180   slotno = function_arg_slotno (cum, mode, type, named, 0, &regno, &padding);
4181
4182   /* If register required leading padding, add it.  */
4183   if (slotno != -1)
4184     cum->words += padding;
4185
4186   if (TARGET_ARCH32)
4187     {
4188       cum->words += (mode != BLKmode
4189                      ? ROUND_ADVANCE (GET_MODE_SIZE (mode))
4190                      : ROUND_ADVANCE (int_size_in_bytes (type)));
4191     }
4192   else
4193     {
4194       if (type && AGGREGATE_TYPE_P (type))
4195         {
4196           int size = int_size_in_bytes (type);
4197
4198           if (size <= 8)
4199             ++cum->words;
4200           else if (size <= 16)
4201             cum->words += 2;
4202           else /* passed by reference */
4203             ++cum->words;
4204         }
4205       else if (GET_MODE_CLASS (mode) == MODE_COMPLEX_INT)
4206         {
4207           cum->words += 2;
4208         }
4209       else if (GET_MODE_CLASS (mode) == MODE_COMPLEX_FLOAT)
4210         {
4211           cum->words += GET_MODE_SIZE (mode) / UNITS_PER_WORD;
4212         }
4213       else
4214         {
4215           cum->words += (mode != BLKmode
4216                          ? ROUND_ADVANCE (GET_MODE_SIZE (mode))
4217                          : ROUND_ADVANCE (int_size_in_bytes (type)));
4218         }
4219     }
4220 }
4221
4222 /* Handle the FUNCTION_ARG_PADDING macro.
4223    For the 64 bit ABI structs are always stored left shifted in their
4224    argument slot.  */
4225
4226 enum direction
4227 function_arg_padding (mode, type)
4228      enum machine_mode mode;
4229      tree type;
4230 {
4231   if (TARGET_ARCH64 && type && TREE_CODE (type) == RECORD_TYPE)
4232     {
4233       return upward;
4234     }
4235
4236   /* This is the default definition.  */
4237   return (! BYTES_BIG_ENDIAN
4238           ? upward
4239           : ((mode == BLKmode
4240               ? (type && TREE_CODE (TYPE_SIZE (type)) == INTEGER_CST
4241                  && int_size_in_bytes (type) < (PARM_BOUNDARY / BITS_PER_UNIT))
4242               : GET_MODE_BITSIZE (mode) < PARM_BOUNDARY)
4243              ? downward : upward));
4244 }
4245 \f
4246 /* Do what is necessary for `va_start'.  The argument is ignored.
4247
4248    We look at the current function to determine if stdarg or varargs
4249    is used and return the address of the first unnamed parameter.  */
4250
4251 rtx
4252 sparc_builtin_saveregs (arglist)
4253      tree arglist;
4254 {
4255   tree fntype = TREE_TYPE (current_function_decl);
4256   int stdarg = (TYPE_ARG_TYPES (fntype) != 0
4257                 && (TREE_VALUE (tree_last (TYPE_ARG_TYPES (fntype)))
4258                     != void_type_node));
4259   int first_reg = current_function_args_info.words;
4260   rtx address;
4261   int regno;
4262
4263   for (regno = first_reg; regno < NPARM_REGS (word_mode); regno++)
4264     emit_move_insn (gen_rtx (MEM, word_mode,
4265                              gen_rtx (PLUS, Pmode,
4266                                       frame_pointer_rtx,
4267                                       GEN_INT (STACK_POINTER_OFFSET
4268                                                + UNITS_PER_WORD * regno))),
4269                     gen_rtx (REG, word_mode,
4270                              BASE_INCOMING_ARG_REG (word_mode) + regno));
4271
4272   address = gen_rtx (PLUS, Pmode,
4273                      frame_pointer_rtx,
4274                      GEN_INT (STACK_POINTER_OFFSET
4275                               + UNITS_PER_WORD * first_reg));
4276
4277   if (flag_check_memory_usage
4278       && first_reg < NPARM_REGS (word_mode))
4279     emit_library_call (chkr_set_right_libfunc, 1, VOIDmode, 3,
4280                        address, ptr_mode,
4281                        GEN_INT (UNITS_PER_WORD
4282                                 * (NPARM_REGS (word_mode) - first_reg)),
4283                        TYPE_MODE (sizetype), GEN_INT (MEMORY_USE_RW),
4284                        TYPE_MODE (integer_type_node));
4285
4286   return address;
4287 }
4288 \f
4289 /* Return the string to output a conditional branch to LABEL, which is
4290    the operand number of the label.  OP is the conditional expression.
4291    XEXP (OP, 0) is assumed to be a condition code register (integer or
4292    floating point) and its mode specifies what kind of comparison we made.
4293
4294    REVERSED is non-zero if we should reverse the sense of the comparison.
4295
4296    ANNUL is non-zero if we should generate an annulling branch.
4297
4298    NOOP is non-zero if we have to follow this branch by a noop.  */
4299
4300 char *
4301 output_cbranch (op, label, reversed, annul, noop)
4302      rtx op;
4303      int label;
4304      int reversed, annul, noop;
4305 {
4306   static char string[20];
4307   enum rtx_code code = GET_CODE (op);
4308   rtx cc_reg = XEXP (op, 0);
4309   enum machine_mode mode = GET_MODE (cc_reg);
4310   static char v8_labelno[] = " %lX";
4311   static char v9_icc_labelno[] = " %%icc,%lX";
4312   static char v9_xcc_labelno[] = " %%xcc,%lX";
4313   static char v9_fcc_labelno[] = " %%fccX,%lY";
4314   char *labelno;
4315   int labeloff;
4316
4317   /* ??? !v9: FP branches cannot be preceded by another floating point insn.
4318      Because there is currently no concept of pre-delay slots, we can fix
4319      this only by always emitting a nop before a floating point branch.  */
4320
4321   if ((mode == CCFPmode || mode == CCFPEmode) && ! TARGET_V9)
4322     strcpy (string, "nop\n\t");
4323   else
4324     string[0] = '\0';
4325
4326   /* If not floating-point or if EQ or NE, we can just reverse the code.  */
4327   if (reversed
4328       && ((mode != CCFPmode && mode != CCFPEmode) || code == EQ || code == NE))
4329     code = reverse_condition (code), reversed = 0;
4330
4331   /* Start by writing the branch condition.  */
4332   switch (code)
4333     {
4334     case NE:
4335       if (mode == CCFPmode || mode == CCFPEmode)
4336         strcat (string, "fbne");
4337       else
4338         strcpy (string, "bne");
4339       break;
4340
4341     case EQ:
4342       if (mode == CCFPmode || mode == CCFPEmode)
4343         strcat (string, "fbe");
4344       else
4345         strcpy (string, "be");
4346       break;
4347
4348     case GE:
4349       if (mode == CCFPmode || mode == CCFPEmode)
4350         {
4351           if (reversed)
4352             strcat (string, "fbul");
4353           else
4354             strcat (string, "fbge");
4355         }
4356       else if (mode == CC_NOOVmode)
4357         strcpy (string, "bpos");
4358       else
4359         strcpy (string, "bge");
4360       break;
4361
4362     case GT:
4363       if (mode == CCFPmode || mode == CCFPEmode)
4364         {
4365           if (reversed)
4366             strcat (string, "fbule");
4367           else
4368             strcat (string, "fbg");
4369         }
4370       else
4371         strcpy (string, "bg");
4372       break;
4373
4374     case LE:
4375       if (mode == CCFPmode || mode == CCFPEmode)
4376         {
4377           if (reversed)
4378             strcat (string, "fbug");
4379           else
4380             strcat (string, "fble");
4381         }
4382       else
4383         strcpy (string, "ble");
4384       break;
4385
4386     case LT:
4387       if (mode == CCFPmode || mode == CCFPEmode)
4388         {
4389           if (reversed)
4390             strcat (string, "fbuge");
4391           else
4392             strcat (string, "fbl");
4393         }
4394       else if (mode == CC_NOOVmode)
4395         strcpy (string, "bneg");
4396       else
4397         strcpy (string, "bl");
4398       break;
4399
4400     case GEU:
4401       strcpy (string, "bgeu");
4402       break;
4403
4404     case GTU:
4405       strcpy (string, "bgu");
4406       break;
4407
4408     case LEU:
4409       strcpy (string, "bleu");
4410       break;
4411
4412     case LTU:
4413       strcpy (string, "blu");
4414       break;
4415     }
4416
4417   /* Now add the annulling, the label, and a possible noop.  */
4418   if (annul)
4419     strcat (string, ",a");
4420
4421   /* ??? If v9, optional prediction bit ",pt" or ",pf" goes here.  */
4422
4423   if (! TARGET_V9)
4424     {
4425       labeloff = 3;
4426       labelno = v8_labelno;
4427     }
4428   else
4429     {
4430       labeloff = 9;
4431       if (mode == CCFPmode || mode == CCFPEmode)
4432         {
4433           labeloff = 10;
4434           labelno = v9_fcc_labelno;
4435           /* Set the char indicating the number of the fcc reg to use.  */
4436           labelno[6] = REGNO (cc_reg) - SPARC_FIRST_V9_FCC_REG + '0';
4437         }
4438       else if (mode == CCXmode || mode == CCX_NOOVmode)
4439         labelno = v9_xcc_labelno;
4440       else
4441         labelno = v9_icc_labelno;
4442     }
4443   /* Set the char indicating the number of the operand containing the
4444      label_ref.  */
4445   labelno[labeloff] = label + '0';
4446   strcat (string, labelno);
4447
4448   if (noop)
4449     strcat (string, "\n\tnop");
4450
4451   return string;
4452 }
4453
4454 /* Return the string to output a conditional branch to LABEL, testing
4455    register REG.  LABEL is the operand number of the label; REG is the
4456    operand number of the reg.  OP is the conditional expression.  The mode
4457    of REG says what kind of comparison we made.
4458
4459    REVERSED is non-zero if we should reverse the sense of the comparison.
4460
4461    ANNUL is non-zero if we should generate an annulling branch.
4462
4463    NOOP is non-zero if we have to follow this branch by a noop.  */
4464
4465 char *
4466 output_v9branch (op, reg, label, reversed, annul, noop)
4467      rtx op;
4468      int reg, label;
4469      int reversed, annul, noop;
4470 {
4471   static char string[20];
4472   enum rtx_code code = GET_CODE (op);
4473   enum machine_mode mode = GET_MODE (XEXP (op, 0));
4474   static char labelno[] = " %X,%lX";
4475
4476   /* If not floating-point or if EQ or NE, we can just reverse the code.  */
4477   if (reversed)
4478     code = reverse_condition (code), reversed = 0;
4479
4480   /* Only 64 bit versions of these instructions exist.  */
4481   if (mode != DImode)
4482     abort ();
4483
4484   /* Start by writing the branch condition.  */
4485
4486   switch (code)
4487     {
4488     case NE:
4489       strcpy (string, "brnz");
4490       break;
4491
4492     case EQ:
4493       strcpy (string, "brz");
4494       break;
4495
4496     case GE:
4497       strcpy (string, "brgez");
4498       break;
4499
4500     case LT:
4501       strcpy (string, "brlz");
4502       break;
4503
4504     case LE:
4505       strcpy (string, "brlez");
4506       break;
4507
4508     case GT:
4509       strcpy (string, "brgz");
4510       break;
4511
4512     default:
4513       abort ();
4514     }
4515
4516   /* Now add the annulling, reg, label, and nop.  */
4517   if (annul)
4518     strcat (string, ",a");
4519
4520   /* ??? Optional prediction bit ",pt" or ",pf" goes here.  */
4521
4522   labelno[2] = reg + '0';
4523   labelno[6] = label + '0';
4524   strcat (string, labelno);
4525
4526   if (noop)
4527     strcat (string, "\n\tnop");
4528
4529   return string;
4530 }
4531
4532 /* Output assembler code to return from a function.  */
4533
4534 /* ??? v9: Update to use the new `return' instruction.  Also, add patterns to
4535    md file for the `return' instruction.  */
4536
4537 char *
4538 output_return (operands)
4539      rtx *operands;
4540 {
4541   if (leaf_label)
4542     {
4543       operands[0] = leaf_label;
4544       return "b,a %l0";
4545     }
4546   else if (leaf_function)
4547     {
4548       /* If we didn't allocate a frame pointer for the current function,
4549          the stack pointer might have been adjusted.  Output code to
4550          restore it now.  */
4551
4552       operands[0] = gen_rtx (CONST_INT, VOIDmode, actual_fsize);
4553
4554       /* Use sub of negated value in first two cases instead of add to
4555          allow actual_fsize == 4096.  */
4556
4557       if (actual_fsize <= 4096)
4558         {
4559           if (SKIP_CALLERS_UNIMP_P)
4560             return "jmp %%o7+12\n\tsub %%sp,-%0,%%sp";
4561           else
4562             return "retl\n\tsub %%sp,-%0,%%sp";
4563         }
4564       else if (actual_fsize <= 8192)
4565         {
4566           operands[0] = gen_rtx (CONST_INT, VOIDmode, actual_fsize - 4096);
4567           if (SKIP_CALLERS_UNIMP_P)
4568             return "sub %%sp,-4096,%%sp\n\tjmp %%o7+12\n\tsub %%sp,-%0,%%sp";
4569           else
4570             return "sub %%sp,-4096,%%sp\n\tretl\n\tsub %%sp,-%0,%%sp";
4571         }
4572       else if (SKIP_CALLERS_UNIMP_P)
4573         {
4574           if ((actual_fsize & 0x3ff) != 0)
4575             return "sethi %%hi(%a0),%%g1\n\tor %%g1,%%lo(%a0),%%g1\n\tjmp %%o7+12\n\tadd %%sp,%%g1,%%sp";
4576           else
4577             return "sethi %%hi(%a0),%%g1\n\tjmp %%o7+12\n\tadd %%sp,%%g1,%%sp";
4578         }
4579       else
4580         {
4581           if ((actual_fsize & 0x3ff) != 0)
4582             return "sethi %%hi(%a0),%%g1\n\tor %%g1,%%lo(%a0),%%g1\n\tretl\n\tadd %%sp,%%g1,%%sp";
4583           else
4584             return "sethi %%hi(%a0),%%g1\n\tretl\n\tadd %%sp,%%g1,%%sp";
4585         }
4586     }
4587   else
4588     {
4589       if (SKIP_CALLERS_UNIMP_P)
4590         return "jmp %%i7+12\n\trestore";
4591       else
4592         return "ret\n\trestore";
4593     }
4594 }
4595 \f
4596 /* Leaf functions and non-leaf functions have different needs.  */
4597
4598 static int
4599 reg_leaf_alloc_order[] = REG_LEAF_ALLOC_ORDER;
4600
4601 static int
4602 reg_nonleaf_alloc_order[] = REG_ALLOC_ORDER;
4603
4604 static int *reg_alloc_orders[] = {
4605   reg_leaf_alloc_order,
4606   reg_nonleaf_alloc_order};
4607
4608 void
4609 order_regs_for_local_alloc ()
4610 {
4611   static int last_order_nonleaf = 1;
4612
4613   if (regs_ever_live[15] != last_order_nonleaf)
4614     {
4615       last_order_nonleaf = !last_order_nonleaf;
4616       bcopy ((char *) reg_alloc_orders[last_order_nonleaf],
4617              (char *) reg_alloc_order, FIRST_PSEUDO_REGISTER * sizeof (int));
4618     }
4619 }
4620 \f
4621 /* Return 1 if REGNO (reg1) is even and REGNO (reg1) == REGNO (reg2) - 1.
4622    This makes them candidates for using ldd and std insns.
4623
4624    Note reg1 and reg2 *must* be hard registers.  To be sure we will
4625    abort if we are passed pseudo registers.  */
4626
4627 int
4628 registers_ok_for_ldd_peep (reg1, reg2)
4629      rtx reg1, reg2;
4630 {
4631   /* We might have been passed a SUBREG.  */
4632   if (GET_CODE (reg1) != REG || GET_CODE (reg2) != REG)
4633     return 0;
4634
4635   if (REGNO (reg1) % 2 != 0)
4636     return 0;
4637
4638   return (REGNO (reg1) == REGNO (reg2) - 1);
4639 }
4640
4641 /* Return 1 if addr1 and addr2 are suitable for use in an ldd or
4642    std insn.
4643
4644    This can only happen when addr1 and addr2 are consecutive memory
4645    locations (addr1 + 4 == addr2).  addr1 must also be aligned on a
4646    64 bit boundary (addr1 % 8 == 0).
4647
4648    We know %sp and %fp are kept aligned on a 64 bit boundary.  Other
4649    registers are assumed to *never* be properly aligned and are
4650    rejected.
4651
4652    Knowing %sp and %fp are kept aligned on a 64 bit boundary, we
4653    need only check that the offset for addr1 % 8 == 0.  */
4654
4655 int
4656 addrs_ok_for_ldd_peep (addr1, addr2)
4657       rtx addr1, addr2;
4658 {
4659   int reg1, offset1;
4660
4661   /* Extract a register number and offset (if used) from the first addr.  */
4662   if (GET_CODE (addr1) == PLUS)
4663     {
4664       /* If not a REG, return zero.  */
4665       if (GET_CODE (XEXP (addr1, 0)) != REG)
4666         return 0;
4667       else
4668         {
4669           reg1 = REGNO (XEXP (addr1, 0));
4670           /* The offset must be constant!  */
4671           if (GET_CODE (XEXP (addr1, 1)) != CONST_INT)
4672             return 0;
4673           offset1 = INTVAL (XEXP (addr1, 1));
4674         }
4675     }
4676   else if (GET_CODE (addr1) != REG)
4677     return 0;
4678   else
4679     {
4680       reg1 = REGNO (addr1);
4681       /* This was a simple (mem (reg)) expression.  Offset is 0.  */
4682       offset1 = 0;
4683     }
4684
4685   /* Make sure the second address is a (mem (plus (reg) (const_int).  */
4686   if (GET_CODE (addr2) != PLUS)
4687     return 0;
4688
4689   if (GET_CODE (XEXP (addr2, 0)) != REG
4690       || GET_CODE (XEXP (addr2, 1)) != CONST_INT)
4691     return 0;
4692
4693   /* Only %fp and %sp are allowed.  Additionally both addresses must
4694      use the same register.  */
4695   if (reg1 != FRAME_POINTER_REGNUM && reg1 != STACK_POINTER_REGNUM)
4696     return 0;
4697
4698   if (reg1 != REGNO (XEXP (addr2, 0)))
4699     return 0;
4700
4701   /* The first offset must be evenly divisible by 8 to ensure the
4702      address is 64 bit aligned.  */
4703   if (offset1 % 8 != 0)
4704     return 0;
4705
4706   /* The offset for the second addr must be 4 more than the first addr.  */
4707   if (INTVAL (XEXP (addr2, 1)) != offset1 + 4)
4708     return 0;
4709
4710   /* All the tests passed.  addr1 and addr2 are valid for ldd and std
4711      instructions.  */
4712   return 1;
4713 }
4714
4715 /* Return 1 if reg is a pseudo, or is the first register in
4716    a hard register pair.  This makes it a candidate for use in
4717    ldd and std insns.  */
4718
4719 int
4720 register_ok_for_ldd (reg)
4721      rtx reg;
4722 {
4723   /* We might have been passed a SUBREG.  */
4724   if (GET_CODE (reg) != REG)
4725     return 0;
4726
4727   if (REGNO (reg) < FIRST_PSEUDO_REGISTER)
4728     return (REGNO (reg) % 2 == 0);
4729   else
4730     return 1;
4731 }
4732 \f
4733 /* Print operand X (an rtx) in assembler syntax to file FILE.
4734    CODE is a letter or dot (`z' in `%z0') or 0 if no letter was specified.
4735    For `%' followed by punctuation, CODE is the punctuation and X is null.  */
4736
4737 void
4738 print_operand (file, x, code)
4739      FILE *file;
4740      rtx x;
4741      int code;
4742 {
4743   switch (code)
4744     {
4745     case '#':
4746       /* Output a 'nop' if there's nothing for the delay slot.  */
4747       if (dbr_sequence_length () == 0)
4748         fputs ("\n\tnop", file);
4749       return;
4750     case '*':
4751       /* Output an annul flag if there's nothing for the delay slot and we
4752          are optimizing.  This is always used with '(' below.  */
4753       /* Sun OS 4.1.1 dbx can't handle an annulled unconditional branch;
4754          this is a dbx bug.  So, we only do this when optimizing.  */
4755       if (dbr_sequence_length () == 0 && optimize)
4756         fputs (",a", file);
4757       return;
4758     case '(':
4759       /* Output a 'nop' if there's nothing for the delay slot and we are
4760          not optimizing.  This is always used with '*' above.  */
4761       if (dbr_sequence_length () == 0 && ! optimize)
4762         fputs ("\n\tnop", file);
4763       return;
4764     case '_':
4765       /* Output the Embedded Medium/Anywhere code model base register.  */
4766       fputs (EMBMEDANY_BASE_REG, file);
4767       return;
4768     case '@':
4769       /* Print out what we are using as the frame pointer.  This might
4770          be %fp, or might be %sp+offset.  */
4771       /* ??? What if offset is too big? Perhaps the caller knows it isn't? */
4772       fprintf (file, "%s+%d", frame_base_name, frame_base_offset);
4773       return;
4774     case 'Y':
4775       /* Adjust the operand to take into account a RESTORE operation.  */
4776       if (GET_CODE (x) != REG)
4777         output_operand_lossage ("Invalid %%Y operand");
4778       else if (REGNO (x) < 8)
4779         fputs (reg_names[REGNO (x)], file);
4780       else if (REGNO (x) >= 24 && REGNO (x) < 32)
4781         fputs (reg_names[REGNO (x)-16], file);
4782       else
4783         output_operand_lossage ("Invalid %%Y operand");
4784       return;
4785     case 'L':
4786       /* Print out the low order register name of a register pair.  */
4787       if (WORDS_BIG_ENDIAN)
4788         fputs (reg_names[REGNO (x)+1], file);
4789       else
4790         fputs (reg_names[REGNO (x)], file);
4791       return;
4792     case 'H':
4793       /* Print out the high order register name of a register pair.  */
4794       if (WORDS_BIG_ENDIAN)
4795         fputs (reg_names[REGNO (x)], file);
4796       else
4797         fputs (reg_names[REGNO (x)+1], file);
4798       return;
4799     case 'R':
4800       /* Print out the second register name of a register pair or quad.
4801          I.e., R (%o0) => %o1.  */
4802       fputs (reg_names[REGNO (x)+1], file);
4803       return;
4804     case 'S':
4805       /* Print out the third register name of a register quad.
4806          I.e., S (%o0) => %o2.  */
4807       fputs (reg_names[REGNO (x)+2], file);
4808       return;
4809     case 'T':
4810       /* Print out the fourth register name of a register quad.
4811          I.e., T (%o0) => %o3.  */
4812       fputs (reg_names[REGNO (x)+3], file);
4813       return;
4814     case 'x':
4815       /* Print a condition code register.  */
4816       if (REGNO (x) == SPARC_ICC_REG)
4817         {
4818           /* We don't handle CC[X]_NOOVmode because they're not supposed
4819              to occur here.  */
4820           if (GET_MODE (x) == CCmode)
4821             fputs ("%icc", file);
4822           else if (GET_MODE (x) == CCXmode)
4823             fputs ("%xcc", file);
4824           else
4825             abort ();
4826         }
4827       else
4828         /* %fccN register */
4829         fputs (reg_names[REGNO (x)], file);
4830       return;
4831     case 'm':
4832       /* Print the operand's address only.  */
4833       output_address (XEXP (x, 0));
4834       return;
4835     case 'r':
4836       /* In this case we need a register.  Use %g0 if the
4837          operand is const0_rtx.  */
4838       if (x == const0_rtx
4839           || (GET_MODE (x) != VOIDmode && x == CONST0_RTX (GET_MODE (x))))
4840         {
4841           fputs ("%g0", file);
4842           return;
4843         }
4844       else
4845         break;
4846
4847     case 'A':
4848       switch (GET_CODE (x))
4849         {
4850         case IOR: fputs ("or", file); break;
4851         case AND: fputs ("and", file); break;
4852         case XOR: fputs ("xor", file); break;
4853         default: output_operand_lossage ("Invalid %%A operand");
4854         }
4855       return;
4856
4857     case 'B':
4858       switch (GET_CODE (x))
4859         {
4860         case IOR: fputs ("orn", file); break;
4861         case AND: fputs ("andn", file); break;
4862         case XOR: fputs ("xnor", file); break;
4863         default: output_operand_lossage ("Invalid %%B operand");
4864         }
4865       return;
4866
4867       /* These are used by the conditional move instructions.  */
4868     case 'c' :
4869     case 'C':
4870       {
4871         enum rtx_code rc = (code == 'c'
4872                             ? reverse_condition (GET_CODE (x))
4873                             : GET_CODE (x));
4874         switch (rc)
4875           {
4876           case NE: fputs ("ne", file); break;
4877           case EQ: fputs ("e", file); break;
4878           case GE: fputs ("ge", file); break;
4879           case GT: fputs ("g", file); break;
4880           case LE: fputs ("le", file); break;
4881           case LT: fputs ("l", file); break;
4882           case GEU: fputs ("geu", file); break;
4883           case GTU: fputs ("gu", file); break;
4884           case LEU: fputs ("leu", file); break;
4885           case LTU: fputs ("lu", file); break;
4886           default: output_operand_lossage (code == 'c'
4887                                            ? "Invalid %%c operand"
4888                                            : "Invalid %%C operand");
4889           }
4890         return;
4891       }
4892
4893       /* These are used by the movr instruction pattern.  */
4894     case 'd':
4895     case 'D':
4896       {
4897         enum rtx_code rc = (code == 'd'
4898                             ? reverse_condition (GET_CODE (x))
4899                             : GET_CODE (x));
4900         switch (rc)
4901           {
4902           case NE: fputs ("ne", file); break;
4903           case EQ: fputs ("e", file); break;
4904           case GE: fputs ("gez", file); break;
4905           case LT: fputs ("lz", file); break;
4906           case LE: fputs ("lez", file); break;
4907           case GT: fputs ("gz", file); break;
4908           default: output_operand_lossage (code == 'd'
4909                                            ? "Invalid %%d operand"
4910                                            : "Invalid %%D operand");
4911           }
4912         return;
4913       }
4914
4915     case 'b':
4916       {
4917         /* Print a sign-extended character.  */
4918         int i = INTVAL (x) & 0xff;
4919         if (i & 0x80)
4920           i |= 0xffffff00;
4921         fprintf (file, "%d", i);
4922         return;
4923       }
4924
4925     case 'f':
4926       /* Operand must be a MEM; write its address.  */
4927       if (GET_CODE (x) != MEM)
4928         output_operand_lossage ("Invalid %%f operand");
4929       output_address (XEXP (x, 0));
4930       return;
4931
4932     case 0:
4933       /* Do nothing special.  */
4934       break;
4935
4936     default:
4937       /* Undocumented flag.  */
4938       output_operand_lossage ("invalid operand output code");
4939     }
4940
4941   if (GET_CODE (x) == REG)
4942     fputs (reg_names[REGNO (x)], file);
4943   else if (GET_CODE (x) == MEM)
4944     {
4945       fputc ('[', file);
4946         /* Poor Sun assembler doesn't understand absolute addressing.  */
4947       if (CONSTANT_P (XEXP (x, 0))
4948           && ! TARGET_LIVE_G0)
4949         fputs ("%g0+", file);
4950       output_address (XEXP (x, 0));
4951       fputc (']', file);
4952     }
4953   else if (GET_CODE (x) == HIGH)
4954     {
4955       fputs ("%hi(", file);
4956       output_addr_const (file, XEXP (x, 0));
4957       fputc (')', file);
4958     }
4959   else if (GET_CODE (x) == LO_SUM)
4960     {
4961       print_operand (file, XEXP (x, 0), 0);
4962       fputs ("+%lo(", file);
4963       output_addr_const (file, XEXP (x, 1));
4964       fputc (')', file);
4965     }
4966   else if (GET_CODE (x) == CONST_DOUBLE
4967            && (GET_MODE (x) == VOIDmode
4968                || GET_MODE_CLASS (GET_MODE (x)) == MODE_INT))
4969     {
4970       if (CONST_DOUBLE_HIGH (x) == 0)
4971         fprintf (file, "%u", CONST_DOUBLE_LOW (x));
4972       else if (CONST_DOUBLE_HIGH (x) == -1
4973                && CONST_DOUBLE_LOW (x) < 0)
4974         fprintf (file, "%d", CONST_DOUBLE_LOW (x));
4975       else
4976         output_operand_lossage ("long long constant not a valid immediate operand");
4977     }
4978   else if (GET_CODE (x) == CONST_DOUBLE)
4979     output_operand_lossage ("floating point constant not a valid immediate operand");
4980   else { output_addr_const (file, x); }
4981 }
4982 \f
4983 /* This function outputs assembler code for VALUE to FILE, where VALUE is
4984    a 64 bit (DImode) value.  */
4985
4986 /* ??? If there is a 64 bit counterpart to .word that the assembler
4987    understands, then using that would simply this code greatly.  */
4988 /* ??? We only output .xword's for symbols and only then in environments
4989    where the assembler can handle them.  */
4990
4991 void
4992 output_double_int (file, value)
4993      FILE *file;
4994      rtx value;
4995 {
4996   if (GET_CODE (value) == CONST_INT)
4997     {
4998       /* ??? This has endianness issues.  */
4999 #if HOST_BITS_PER_WIDE_INT == 64
5000       HOST_WIDE_INT xword = INTVAL (value);
5001       HOST_WIDE_INT high, low;
5002
5003       high = (xword >> 32) & 0xffffffff;
5004       low  = xword & 0xffffffff;
5005       ASM_OUTPUT_INT (file, gen_rtx (CONST_INT, VOIDmode, high));
5006       ASM_OUTPUT_INT (file, gen_rtx (CONST_INT, VOIDmode, low));
5007 #else
5008       if (INTVAL (value) < 0)
5009         ASM_OUTPUT_INT (file, constm1_rtx);
5010       else
5011         ASM_OUTPUT_INT (file, const0_rtx);
5012       ASM_OUTPUT_INT (file, value);
5013 #endif
5014     }
5015   else if (GET_CODE (value) == CONST_DOUBLE)
5016     {
5017       ASM_OUTPUT_INT (file, gen_rtx (CONST_INT, VOIDmode,
5018                                      CONST_DOUBLE_HIGH (value)));
5019       ASM_OUTPUT_INT (file, gen_rtx (CONST_INT, VOIDmode,
5020                                      CONST_DOUBLE_LOW (value)));
5021     }
5022   else if (GET_CODE (value) == SYMBOL_REF
5023            || GET_CODE (value) == CONST
5024            || GET_CODE (value) == PLUS
5025            || (TARGET_ARCH64 &&
5026                (GET_CODE (value) == LABEL_REF
5027                 || GET_CODE (value) == CODE_LABEL
5028                 || GET_CODE (value) == MINUS)))
5029     {
5030       if (!TARGET_V9 || TARGET_CM_MEDLOW)
5031         {
5032           ASM_OUTPUT_INT (file, const0_rtx);
5033           ASM_OUTPUT_INT (file, value);
5034         }
5035       else
5036         {
5037           fprintf (file, "\t%s\t", ASM_LONGLONG);
5038           output_addr_const (file, value);
5039           fprintf (file, "\n");
5040         }
5041     }
5042   else
5043     abort ();
5044 }
5045 \f
5046 /* Return the value of a code used in the .proc pseudo-op that says
5047    what kind of result this function returns.  For non-C types, we pick
5048    the closest C type.  */
5049
5050 #ifndef CHAR_TYPE_SIZE
5051 #define CHAR_TYPE_SIZE BITS_PER_UNIT
5052 #endif
5053
5054 #ifndef SHORT_TYPE_SIZE
5055 #define SHORT_TYPE_SIZE (BITS_PER_UNIT * 2)
5056 #endif
5057
5058 #ifndef INT_TYPE_SIZE
5059 #define INT_TYPE_SIZE BITS_PER_WORD
5060 #endif
5061
5062 #ifndef LONG_TYPE_SIZE
5063 #define LONG_TYPE_SIZE BITS_PER_WORD
5064 #endif
5065
5066 #ifndef LONG_LONG_TYPE_SIZE
5067 #define LONG_LONG_TYPE_SIZE (BITS_PER_WORD * 2)
5068 #endif
5069
5070 #ifndef FLOAT_TYPE_SIZE
5071 #define FLOAT_TYPE_SIZE BITS_PER_WORD
5072 #endif
5073
5074 #ifndef DOUBLE_TYPE_SIZE
5075 #define DOUBLE_TYPE_SIZE (BITS_PER_WORD * 2)
5076 #endif
5077
5078 #ifndef LONG_DOUBLE_TYPE_SIZE
5079 #define LONG_DOUBLE_TYPE_SIZE (BITS_PER_WORD * 2)
5080 #endif
5081
5082 unsigned long
5083 sparc_type_code (type)
5084      register tree type;
5085 {
5086   register unsigned long qualifiers = 0;
5087   register unsigned shift = 6;
5088
5089   /* Only the first 30 bits of the qualifier are valid.  We must refrain from
5090      setting more, since some assemblers will give an error for this.  Also,
5091      we must be careful to avoid shifts of 32 bits or more to avoid getting
5092      unpredictable results.  */
5093
5094   for (;;)
5095     {
5096       switch (TREE_CODE (type))
5097         {
5098         case ERROR_MARK:
5099           return qualifiers;
5100
5101         case ARRAY_TYPE:
5102           if (shift < 30)
5103             qualifiers |= (3 << shift);
5104           shift += 2;
5105           type = TREE_TYPE (type);
5106           break;
5107
5108         case FUNCTION_TYPE:
5109         case METHOD_TYPE:
5110           if (shift < 30)
5111             qualifiers |= (2 << shift);
5112           shift += 2;
5113           type = TREE_TYPE (type);
5114           break;
5115
5116         case POINTER_TYPE:
5117         case REFERENCE_TYPE:
5118         case OFFSET_TYPE:
5119           if (shift < 30)
5120             qualifiers |= (1 << shift);
5121           shift += 2;
5122           type = TREE_TYPE (type);
5123           break;
5124
5125         case RECORD_TYPE:
5126           return (qualifiers | 8);
5127
5128         case UNION_TYPE:
5129         case QUAL_UNION_TYPE:
5130           return (qualifiers | 9);
5131
5132         case ENUMERAL_TYPE:
5133           return (qualifiers | 10);
5134
5135         case VOID_TYPE:
5136           return (qualifiers | 16);
5137
5138         case INTEGER_TYPE:
5139           /* If this is a range type, consider it to be the underlying
5140              type.  */
5141           if (TREE_TYPE (type) != 0)
5142             {
5143               type = TREE_TYPE (type);
5144               break;
5145             }
5146
5147           /* Carefully distinguish all the standard types of C,
5148              without messing up if the language is not C.  We do this by
5149              testing TYPE_PRECISION and TREE_UNSIGNED.  The old code used to
5150              look at both the names and the above fields, but that's redundant.
5151              Any type whose size is between two C types will be considered
5152              to be the wider of the two types.  Also, we do not have a
5153              special code to use for "long long", so anything wider than
5154              long is treated the same.  Note that we can't distinguish
5155              between "int" and "long" in this code if they are the same
5156              size, but that's fine, since neither can the assembler.  */
5157
5158           if (TYPE_PRECISION (type) <= CHAR_TYPE_SIZE)
5159             return (qualifiers | (TREE_UNSIGNED (type) ? 12 : 2));
5160
5161           else if (TYPE_PRECISION (type) <= SHORT_TYPE_SIZE)
5162             return (qualifiers | (TREE_UNSIGNED (type) ? 13 : 3));
5163
5164           else if (TYPE_PRECISION (type) <= INT_TYPE_SIZE)
5165             return (qualifiers | (TREE_UNSIGNED (type) ? 14 : 4));
5166
5167           else
5168             return (qualifiers | (TREE_UNSIGNED (type) ? 15 : 5));
5169
5170         case REAL_TYPE:
5171           /* Carefully distinguish all the standard types of C,
5172              without messing up if the language is not C.  */
5173
5174           if (TYPE_PRECISION (type) == FLOAT_TYPE_SIZE)
5175             return (qualifiers | 6);
5176
5177           else
5178             return (qualifiers | 7);
5179
5180         case COMPLEX_TYPE:      /* GNU Fortran COMPLEX type.  */
5181           /* ??? We need to distinguish between double and float complex types,
5182              but I don't know how yet because I can't reach this code from
5183              existing front-ends.  */
5184           return (qualifiers | 7);      /* Who knows? */
5185
5186         case CHAR_TYPE:         /* GNU Pascal CHAR type.  Not used in C.  */
5187         case BOOLEAN_TYPE:      /* GNU Fortran BOOLEAN type.  */
5188         case FILE_TYPE:         /* GNU Pascal FILE type.  */
5189         case SET_TYPE:          /* GNU Pascal SET type.  */
5190         case LANG_TYPE:         /* ? */
5191           return qualifiers;
5192
5193         default:
5194           abort ();             /* Not a type! */
5195         }
5196     }
5197 }
5198 \f
5199 /* Nested function support.  */
5200
5201 /* Emit RTL insns to initialize the variable parts of a trampoline.
5202    FNADDR is an RTX for the address of the function's pure code.
5203    CXT is an RTX for the static chain value for the function.
5204
5205    This takes 16 insns: 2 shifts & 2 ands (to split up addresses), 4 sethi
5206    (to load in opcodes), 4 iors (to merge address and opcodes), and 4 writes
5207    (to store insns).  This is a bit excessive.  Perhaps a different
5208    mechanism would be better here.
5209
5210    Emit enough FLUSH insns to synchronize the data and instruction caches.  */
5211
5212 void
5213 sparc_initialize_trampoline (tramp, fnaddr, cxt)
5214      rtx tramp, fnaddr, cxt;
5215 {
5216   rtx high_cxt = expand_shift (RSHIFT_EXPR, SImode, cxt,
5217                               size_int (10), 0, 1);
5218   rtx high_fn = expand_shift (RSHIFT_EXPR, SImode, fnaddr,
5219                              size_int (10), 0, 1);
5220   rtx low_cxt = expand_and (cxt, gen_rtx (CONST_INT, VOIDmode, 0x3ff), 0);
5221   rtx low_fn = expand_and (fnaddr, gen_rtx (CONST_INT, VOIDmode, 0x3ff), 0);
5222   rtx g1_sethi = gen_rtx (HIGH, SImode,
5223                           gen_rtx (CONST_INT, VOIDmode, 0x03000000));
5224   rtx g2_sethi = gen_rtx (HIGH, SImode,
5225                           gen_rtx (CONST_INT, VOIDmode, 0x05000000));
5226   rtx g1_ori = gen_rtx (HIGH, SImode,
5227                         gen_rtx (CONST_INT, VOIDmode, 0x82106000));
5228   rtx g2_ori = gen_rtx (HIGH, SImode,
5229                         gen_rtx (CONST_INT, VOIDmode, 0x8410A000));
5230   rtx tem = gen_reg_rtx (SImode);
5231   emit_move_insn (tem, g1_sethi);
5232   emit_insn (gen_iorsi3 (high_fn, high_fn, tem));
5233   emit_move_insn (gen_rtx (MEM, SImode, plus_constant (tramp, 0)), high_fn);
5234   emit_move_insn (tem, g1_ori);
5235   emit_insn (gen_iorsi3 (low_fn, low_fn, tem));
5236   emit_move_insn (gen_rtx (MEM, SImode, plus_constant (tramp, 4)), low_fn);
5237   emit_move_insn (tem, g2_sethi);
5238   emit_insn (gen_iorsi3 (high_cxt, high_cxt, tem));
5239   emit_move_insn (gen_rtx (MEM, SImode, plus_constant (tramp, 8)), high_cxt);
5240   emit_move_insn (tem, g2_ori);
5241   emit_insn (gen_iorsi3 (low_cxt, low_cxt, tem));
5242   emit_move_insn (gen_rtx (MEM, SImode, plus_constant (tramp, 16)), low_cxt);
5243   emit_insn (gen_flush (validize_mem (gen_rtx (MEM, SImode, tramp))));
5244   emit_insn (gen_flush (validize_mem (gen_rtx (MEM, SImode,
5245                                                plus_constant (tramp, 8)))));
5246   emit_insn (gen_flush (validize_mem (gen_rtx (MEM, SImode,
5247                                                plus_constant (tramp, 16)))));
5248 }
5249
5250 /* The 64 bit version is simpler because it makes more sense to load the
5251    values as "immediate" data out of the trampoline.  It's also easier since
5252    we can read the PC without clobbering a register.  */
5253
5254 void
5255 sparc64_initialize_trampoline (tramp, fnaddr, cxt)
5256      rtx tramp, fnaddr, cxt;
5257 {
5258   emit_move_insn (gen_rtx (MEM, DImode, plus_constant (tramp, 24)), cxt);
5259   emit_move_insn (gen_rtx (MEM, DImode, plus_constant (tramp, 32)), fnaddr);
5260   emit_insn (gen_flush (validize_mem (gen_rtx (MEM, DImode, tramp))));
5261   emit_insn (gen_flush (validize_mem (gen_rtx (MEM, DImode,
5262                                                plus_constant (tramp, 8)))));
5263   emit_insn (gen_flush (validize_mem (gen_rtx (MEM, DImode,
5264                                                plus_constant (tramp, 16)))));
5265   emit_insn (gen_flush (validize_mem (gen_rtx (MEM, DImode,
5266                                                plus_constant (tramp, 24)))));
5267   emit_insn (gen_flush (validize_mem (gen_rtx (MEM, DImode,
5268                                                plus_constant (tramp, 32)))));
5269 }
5270 \f
5271 /* Subroutines to support a flat (single) register window calling
5272    convention.  */
5273
5274 /* Single-register window sparc stack frames look like:
5275
5276              Before call                        After call
5277         +-----------------------+       +-----------------------+
5278    high |                       |       |                       |
5279    mem  |  caller's temps.      |       |  caller's temps.      |
5280         |                       |       |                       |
5281         +-----------------------+       +-----------------------+
5282         |                       |       |                       |
5283         |  arguments on stack.  |       |  arguments on stack.  |
5284         |                       |       |                       |
5285         +-----------------------+FP+92->+-----------------------+
5286         |  6 words to save      |       |  6 words to save      |
5287         |  arguments passed     |       |  arguments passed     |
5288         |  in registers, even   |       |  in registers, even   |
5289         |  if not passed.       |       |  if not passed.       |
5290  SP+68->+-----------------------+FP+68->+-----------------------+
5291         | 1 word struct addr    |       | 1 word struct addr    |
5292         +-----------------------+FP+64->+-----------------------+
5293         |                       |       |                       |
5294         | 16 word reg save area |       | 16 word reg save area |
5295         |                       |       |                       |
5296     SP->+-----------------------+   FP->+-----------------------+
5297                                         | 4 word area for       |
5298                                         | fp/alu reg moves      |
5299                                  FP-16->+-----------------------+
5300                                         |                       |
5301                                         |  local variables      |
5302                                         |                       |
5303                                         +-----------------------+
5304                                         |                       |
5305                                         |  fp register save     |
5306                                         |                       |
5307                                         +-----------------------+
5308                                         |                       |
5309                                         |  gp register save     |
5310                                         |                       |
5311                                         +-----------------------+
5312                                         |                       |
5313                                         |  alloca allocations   |
5314                                         |                       |
5315                                         +-----------------------+
5316                                         |                       |
5317                                         |  arguments on stack   |
5318                                         |                       |
5319                                  SP+92->+-----------------------+
5320                                         |  6 words to save      |
5321                                         |  arguments passed     |
5322                                         |  in registers, even   |
5323    low                                  |  if not passed.       |
5324    memory                        SP+68->+-----------------------+
5325                                         | 1 word struct addr    |
5326                                  SP+64->+-----------------------+
5327                                         |                       |
5328                                         I 16 word reg save area |
5329                                         |                       |
5330                                     SP->+-----------------------+  */
5331
5332 /* Structure to be filled in by sparc_flat_compute_frame_size with register
5333    save masks, and offsets for the current function.  */
5334
5335 struct sparc_frame_info
5336 {
5337   unsigned long total_size;     /* # bytes that the entire frame takes up.  */
5338   unsigned long var_size;       /* # bytes that variables take up.  */
5339   unsigned long args_size;      /* # bytes that outgoing arguments take up.  */
5340   unsigned long extra_size;     /* # bytes of extra gunk.  */
5341   unsigned int  gp_reg_size;    /* # bytes needed to store gp regs.  */
5342   unsigned int  fp_reg_size;    /* # bytes needed to store fp regs.  */
5343   unsigned long gmask;          /* Mask of saved gp registers.  */
5344   unsigned long fmask;          /* Mask of saved fp registers.  */
5345   unsigned long reg_offset;     /* Offset from new sp to store regs.  */
5346   int           initialized;    /* Nonzero if frame size already calculated.  */
5347 };
5348
5349 /* Current frame information calculated by sparc_flat_compute_frame_size.  */
5350 struct sparc_frame_info current_frame_info;
5351
5352 /* Zero structure to initialize current_frame_info.  */
5353 struct sparc_frame_info zero_frame_info;
5354
5355 /* Tell prologue and epilogue if register REGNO should be saved / restored.  */
5356
5357 #define RETURN_ADDR_REGNUM 15
5358 #define FRAME_POINTER_MASK (1 << (FRAME_POINTER_REGNUM))
5359 #define RETURN_ADDR_MASK (1 << (RETURN_ADDR_REGNUM))
5360
5361 #define MUST_SAVE_REGISTER(regno) \
5362  ((regs_ever_live[regno] && !call_used_regs[regno])             \
5363   || (regno == FRAME_POINTER_REGNUM && frame_pointer_needed)    \
5364   || (regno == RETURN_ADDR_REGNUM && regs_ever_live[RETURN_ADDR_REGNUM]))
5365
5366 /* Return the bytes needed to compute the frame pointer from the current
5367    stack pointer.  */
5368
5369 unsigned long
5370 sparc_flat_compute_frame_size (size)
5371      int size;                  /* # of var. bytes allocated.  */
5372 {
5373   int regno;
5374   unsigned long total_size;     /* # bytes that the entire frame takes up.  */
5375   unsigned long var_size;       /* # bytes that variables take up.  */
5376   unsigned long args_size;      /* # bytes that outgoing arguments take up.  */
5377   unsigned long extra_size;     /* # extra bytes.  */
5378   unsigned int  gp_reg_size;    /* # bytes needed to store gp regs.  */
5379   unsigned int  fp_reg_size;    /* # bytes needed to store fp regs.  */
5380   unsigned long gmask;          /* Mask of saved gp registers.  */
5381   unsigned long fmask;          /* Mask of saved fp registers.  */
5382   unsigned long reg_offset;     /* Offset to register save area.  */
5383   int           need_aligned_p; /* 1 if need the save area 8 byte aligned.  */
5384
5385   /* This is the size of the 16 word reg save area, 1 word struct addr
5386      area, and 4 word fp/alu register copy area.  */
5387   extra_size     = -STARTING_FRAME_OFFSET + FIRST_PARM_OFFSET(0);
5388   var_size       = size;
5389   /* Also include the size needed for the 6 parameter registers.  */
5390   args_size      = current_function_outgoing_args_size + 24;
5391   total_size     = var_size + args_size + extra_size;
5392   gp_reg_size    = 0;
5393   fp_reg_size    = 0;
5394   gmask          = 0;
5395   fmask          = 0;
5396   reg_offset     = 0;
5397   need_aligned_p = 0;
5398
5399   /* Calculate space needed for gp registers.  */
5400   for (regno = 1; regno <= 31; regno++)
5401     {
5402       if (MUST_SAVE_REGISTER (regno))
5403         {
5404           /* If we need to save two regs in a row, ensure there's room to bump
5405              up the address to align it to a doubleword boundary.  */
5406           if ((regno & 0x1) == 0 && MUST_SAVE_REGISTER (regno+1))
5407             {
5408               if (gp_reg_size % 8 != 0)
5409                 gp_reg_size += 4;
5410               gp_reg_size += 2 * UNITS_PER_WORD;
5411               gmask |= 3 << regno;
5412               regno++;
5413               need_aligned_p = 1;
5414             }
5415           else
5416             {
5417               gp_reg_size += UNITS_PER_WORD;
5418               gmask |= 1 << regno;
5419             }
5420         }
5421     }
5422
5423   /* Calculate space needed for fp registers.  */
5424   for (regno = 32; regno <= 63; regno++)
5425     {
5426       if (regs_ever_live[regno] && !call_used_regs[regno])
5427         {
5428           fp_reg_size += UNITS_PER_WORD;
5429           fmask |= 1 << (regno - 32);
5430         }
5431     }
5432
5433   if (gmask || fmask)
5434     {
5435       int n;
5436       reg_offset = FIRST_PARM_OFFSET(0) + args_size;
5437       /* Ensure save area is 8 byte aligned if we need it.  */
5438       n = reg_offset % 8;
5439       if (need_aligned_p && n != 0)
5440         {
5441           total_size += 8 - n;
5442           reg_offset += 8 - n;
5443         }
5444       total_size += gp_reg_size + fp_reg_size;
5445     }
5446
5447   /* ??? This looks a little suspicious.  Clarify.  */
5448   if (total_size == extra_size)
5449     total_size = extra_size = 0;
5450
5451   total_size = SPARC_STACK_ALIGN (total_size);
5452
5453   /* Save other computed information.  */
5454   current_frame_info.total_size  = total_size;
5455   current_frame_info.var_size    = var_size;
5456   current_frame_info.args_size   = args_size;
5457   current_frame_info.extra_size  = extra_size;
5458   current_frame_info.gp_reg_size = gp_reg_size;
5459   current_frame_info.fp_reg_size = fp_reg_size;
5460   current_frame_info.gmask       = gmask;
5461   current_frame_info.fmask       = fmask;
5462   current_frame_info.reg_offset  = reg_offset;
5463   current_frame_info.initialized = reload_completed;
5464
5465   /* Ok, we're done.  */
5466   return total_size;
5467 }
5468 \f
5469 /* Save/restore registers in GMASK and FMASK at register BASE_REG plus offset
5470    OFFSET.
5471
5472    BASE_REG must be 8 byte aligned.  This allows us to test OFFSET for
5473    appropriate alignment and use DOUBLEWORD_OP when we can.  We assume
5474    [BASE_REG+OFFSET] will always be a valid address.
5475
5476    WORD_OP is either "st" for save, "ld" for restore.
5477    DOUBLEWORD_OP is either "std" for save, "ldd" for restore.  */
5478
5479 void
5480 sparc_flat_save_restore (file, base_reg, offset, gmask, fmask, word_op,
5481                          doubleword_op, base_offset)
5482      FILE *file;
5483      char *base_reg;
5484      unsigned int offset;
5485      unsigned long gmask;
5486      unsigned long fmask;
5487      char *word_op;
5488      char *doubleword_op;
5489      unsigned long base_offset;
5490 {
5491   int regno;
5492
5493   if (gmask == 0 && fmask == 0)
5494     return;
5495
5496   /* Save registers starting from high to low.  We've already saved the
5497      previous frame pointer and previous return address for the debugger's
5498      sake.  The debugger allows us to not need a nop in the epilog if at least
5499      one register is reloaded in addition to return address.  */
5500
5501   if (gmask)
5502     {
5503       for (regno = 1; regno <= 31; regno++)
5504         {
5505           if ((gmask & (1L << regno)) != 0)
5506             {
5507               if ((regno & 0x1) == 0 && ((gmask & (1L << (regno+1))) != 0))
5508                 {
5509                   /* We can save two registers in a row.  If we're not at a
5510                      double word boundary, move to one.
5511                      sparc_flat_compute_frame_size ensures there's room to do
5512                      this.  */
5513                   if (offset % 8 != 0)
5514                     offset += UNITS_PER_WORD;
5515
5516                   if (word_op[0] == 's')
5517                     {
5518                       fprintf (file, "\t%s %s,[%s+%d]\n",
5519                                doubleword_op, reg_names[regno],
5520                                base_reg, offset);
5521                       if (dwarf2out_do_frame ())
5522                         {
5523                           char *l = dwarf2out_cfi_label ();
5524                           dwarf2out_reg_save (l, regno, offset + base_offset);
5525                           dwarf2out_reg_save
5526                             (l, regno+1, offset+base_offset + UNITS_PER_WORD);
5527                         }
5528                     }
5529                   else
5530                     fprintf (file, "\t%s [%s+%d],%s\n",
5531                              doubleword_op, base_reg, offset,
5532                              reg_names[regno]);
5533
5534                   offset += 2 * UNITS_PER_WORD;
5535                   regno++;
5536                 }
5537               else
5538                 {
5539                   if (word_op[0] == 's')
5540                     {
5541                       fprintf (file, "\t%s %s,[%s+%d]\n",
5542                                word_op, reg_names[regno],
5543                                base_reg, offset);
5544                       if (dwarf2out_do_frame ())
5545                         dwarf2out_reg_save ("", regno, offset + base_offset);
5546                     }
5547                   else
5548                     fprintf (file, "\t%s [%s+%d],%s\n",
5549                              word_op, base_reg, offset, reg_names[regno]);
5550
5551                   offset += UNITS_PER_WORD;
5552                 }
5553             }
5554         }
5555     }
5556
5557   if (fmask)
5558     {
5559       for (regno = 32; regno <= 63; regno++)
5560         {
5561           if ((fmask & (1L << (regno - 32))) != 0)
5562             {
5563               if (word_op[0] == 's')
5564                 {
5565                   fprintf (file, "\t%s %s,[%s+%d]\n",
5566                            word_op, reg_names[regno],
5567                            base_reg, offset);
5568                   if (dwarf2out_do_frame ())
5569                     dwarf2out_reg_save ("", regno, offset + base_offset);
5570                 }
5571               else
5572                 fprintf (file, "\t%s [%s+%d],%s\n",
5573                          word_op, base_reg, offset, reg_names[regno]);
5574
5575               offset += UNITS_PER_WORD;
5576             }
5577         }
5578     }
5579 }
5580 \f
5581 /* Set up the stack and frame (if desired) for the function.  */
5582
5583 void
5584 sparc_flat_output_function_prologue (file, size)
5585      FILE *file;
5586      int size;
5587 {
5588   char *sp_str = reg_names[STACK_POINTER_REGNUM];
5589   unsigned long gmask = current_frame_info.gmask;
5590
5591   /* This is only for the human reader.  */
5592   fprintf (file, "\t%s#PROLOGUE# 0\n", ASM_COMMENT_START);
5593   fprintf (file, "\t%s# vars= %d, regs= %d/%d, args= %d, extra= %d\n",
5594            ASM_COMMENT_START,
5595            current_frame_info.var_size,
5596            current_frame_info.gp_reg_size / 4,
5597            current_frame_info.fp_reg_size / 4,
5598            current_function_outgoing_args_size,
5599            current_frame_info.extra_size);
5600
5601   size = SPARC_STACK_ALIGN (size);
5602   size = (! current_frame_info.initialized
5603           ? sparc_flat_compute_frame_size (size)
5604           : current_frame_info.total_size);
5605
5606   /* These cases shouldn't happen.  Catch them now.  */
5607   if (size == 0 && (gmask || current_frame_info.fmask))
5608     abort ();
5609
5610   /* Allocate our stack frame by decrementing %sp.
5611      At present, the only algorithm gdb can use to determine if this is a
5612      flat frame is if we always set %i7 if we set %sp.  This can be optimized
5613      in the future by putting in some sort of debugging information that says
5614      this is a `flat' function.  However, there is still the case of debugging
5615      code without such debugging information (including cases where most fns
5616      have such info, but there is one that doesn't).  So, always do this now
5617      so we don't get a lot of code out there that gdb can't handle.
5618      If the frame pointer isn't needn't then that's ok - gdb won't be able to
5619      distinguish us from a non-flat function but there won't (and shouldn't)
5620      be any differences anyway.  The return pc is saved (if necessary) right
5621      after %i7 so gdb won't have to look too far to find it.  */
5622   if (size > 0)
5623     {
5624       unsigned int reg_offset = current_frame_info.reg_offset;
5625       char *fp_str = reg_names[FRAME_POINTER_REGNUM];
5626       char *t1_str = "%g1";
5627
5628       /* Things get a little tricky if local variables take up more than ~4096
5629          bytes and outgoing arguments take up more than ~4096 bytes.  When that
5630          happens, the register save area can't be accessed from either end of
5631          the frame.  Handle this by decrementing %sp to the start of the gp
5632          register save area, save the regs, update %i7, and then set %sp to its
5633          final value.  Given that we only have one scratch register to play
5634          with it is the cheapest solution, and it helps gdb out as it won't
5635          slow down recognition of flat functions.
5636          Don't change the order of insns emitted here without checking with
5637          the gdb folk first.  */
5638
5639       /* Is the entire register save area offsettable from %sp?  */
5640       if (reg_offset < 4096 - 64 * UNITS_PER_WORD)
5641         {
5642           if (size <= 4096)
5643             {
5644               fprintf (file, "\tadd %s,%d,%s\n",
5645                        sp_str, -size, sp_str);
5646               if (gmask & FRAME_POINTER_MASK)
5647                 {
5648                   fprintf (file, "\tst %s,[%s+%d]\n",
5649                            fp_str, sp_str, reg_offset);
5650                   fprintf (file, "\tsub %s,%d,%s\t%s# set up frame pointer\n",
5651                            sp_str, -size, fp_str, ASM_COMMENT_START);
5652                   reg_offset += 4;
5653                 }
5654             }
5655           else
5656             {
5657               fprintf (file, "\tset %d,%s\n\tsub %s,%s,%s\n",
5658                        size, t1_str, sp_str, t1_str, sp_str);
5659               if (gmask & FRAME_POINTER_MASK)
5660                 {
5661                   fprintf (file, "\tst %s,[%s+%d]\n",
5662                            fp_str, sp_str, reg_offset);
5663                   fprintf (file, "\tadd %s,%s,%s\t%s# set up frame pointer\n",
5664                            sp_str, t1_str, fp_str, ASM_COMMENT_START);
5665                   reg_offset += 4;
5666                 }
5667             }
5668           if (dwarf2out_do_frame ())
5669             {
5670               char *l = dwarf2out_cfi_label ();
5671               if (gmask & FRAME_POINTER_MASK)
5672                 {
5673                   dwarf2out_reg_save (l, FRAME_POINTER_REGNUM,
5674                                       reg_offset - 4 - size);
5675                   dwarf2out_def_cfa (l, FRAME_POINTER_REGNUM, 0);
5676                 }
5677               else
5678                 dwarf2out_def_cfa (l, STACK_POINTER_REGNUM, size);
5679             }
5680           if (gmask & RETURN_ADDR_MASK)
5681             {
5682               fprintf (file, "\tst %s,[%s+%d]\n",
5683                        reg_names[RETURN_ADDR_REGNUM], sp_str, reg_offset);
5684               if (dwarf2out_do_frame ())
5685                 dwarf2out_return_save ("", reg_offset - size);
5686               reg_offset += 4;
5687             }
5688           sparc_flat_save_restore (file, sp_str, reg_offset,
5689                                    gmask & ~(FRAME_POINTER_MASK | RETURN_ADDR_MASK),
5690                                    current_frame_info.fmask,
5691                                    "st", "std", -size);
5692         }
5693       else
5694         {
5695           /* Subtract %sp in two steps, but make sure there is always a
5696              64 byte register save area, and %sp is properly aligned.  */
5697           /* Amount to decrement %sp by, the first time.  */
5698           unsigned int size1 = ((size - reg_offset + 64) + 15) & -16;
5699           /* Offset to register save area from %sp.  */
5700           unsigned int offset = size1 - (size - reg_offset);
5701
5702           if (size1 <= 4096)
5703             {
5704               fprintf (file, "\tadd %s,%d,%s\n",
5705                        sp_str, -size1, sp_str);
5706               if (gmask & FRAME_POINTER_MASK)
5707                 {
5708                   fprintf (file, "\tst %s,[%s+%d]\n\tsub %s,%d,%s\t%s# set up frame pointer\n",
5709                            fp_str, sp_str, offset, sp_str, -size1, fp_str,
5710                            ASM_COMMENT_START);
5711                   offset += 4;
5712                 }
5713             }
5714           else
5715             {
5716               fprintf (file, "\tset %d,%s\n\tsub %s,%s,%s\n",
5717                        size1, t1_str, sp_str, t1_str, sp_str);
5718               if (gmask & FRAME_POINTER_MASK)
5719                 {
5720                   fprintf (file, "\tst %s,[%s+%d]\n\tadd %s,%s,%s\t%s# set up frame pointer\n",
5721                            fp_str, sp_str, offset, sp_str, t1_str, fp_str,
5722                            ASM_COMMENT_START);
5723                   offset += 4;
5724                 }
5725             }
5726           if (dwarf2out_do_frame ())
5727             {
5728               char *l = dwarf2out_cfi_label ();
5729               if (gmask & FRAME_POINTER_MASK)
5730                 {
5731                   dwarf2out_reg_save (l, FRAME_POINTER_REGNUM,
5732                                       offset - 4 - size1);
5733                   dwarf2out_def_cfa (l, FRAME_POINTER_REGNUM, 0);
5734                 }
5735               else
5736                 dwarf2out_def_cfa (l, STACK_POINTER_REGNUM, size1);
5737             }
5738           if (gmask & RETURN_ADDR_MASK)
5739             {
5740               fprintf (file, "\tst %s,[%s+%d]\n",
5741                        reg_names[RETURN_ADDR_REGNUM], sp_str, offset);
5742               if (dwarf2out_do_frame ())
5743                 /* offset - size1 == reg_offset - size
5744                    if reg_offset were updated above like offset.  */
5745                 dwarf2out_return_save ("", offset - size1);
5746               offset += 4;
5747             }
5748           sparc_flat_save_restore (file, sp_str, offset,
5749                                    gmask & ~(FRAME_POINTER_MASK | RETURN_ADDR_MASK),
5750                                    current_frame_info.fmask,
5751                                    "st", "std", -size1);
5752           fprintf (file, "\tset %d,%s\n\tsub %s,%s,%s\n",
5753                    size - size1, t1_str, sp_str, t1_str, sp_str);
5754           if (dwarf2out_do_frame ())
5755             if (! (gmask & FRAME_POINTER_MASK))
5756               dwarf2out_def_cfa ("", STACK_POINTER_REGNUM, size);
5757         }
5758     }
5759
5760   fprintf (file, "\t%s#PROLOGUE# 1\n", ASM_COMMENT_START);
5761 }
5762 \f
5763 /* Do any necessary cleanup after a function to restore stack, frame,
5764    and regs. */
5765
5766 void
5767 sparc_flat_output_function_epilogue (file, size)
5768      FILE *file;
5769      int size;
5770 {
5771   rtx epilogue_delay = current_function_epilogue_delay_list;
5772   int noepilogue = FALSE;
5773
5774   /* This is only for the human reader.  */
5775   fprintf (file, "\t%s#EPILOGUE#\n", ASM_COMMENT_START);
5776
5777   /* The epilogue does not depend on any registers, but the stack
5778      registers, so we assume that if we have 1 pending nop, it can be
5779      ignored, and 2 it must be filled (2 nops occur for integer
5780      multiply and divide).  */
5781
5782   size = SPARC_STACK_ALIGN (size);
5783   size = (!current_frame_info.initialized
5784            ? sparc_flat_compute_frame_size (size)
5785            : current_frame_info.total_size);
5786
5787   if (size == 0 && epilogue_delay == 0)
5788     {
5789       rtx insn = get_last_insn ();
5790
5791       /* If the last insn was a BARRIER, we don't have to write any code
5792          because a jump (aka return) was put there.  */
5793       if (GET_CODE (insn) == NOTE)
5794         insn = prev_nonnote_insn (insn);
5795       if (insn && GET_CODE (insn) == BARRIER)
5796         noepilogue = TRUE;
5797     }
5798
5799   if (!noepilogue)
5800     {
5801       unsigned int reg_offset = current_frame_info.reg_offset;
5802       unsigned int size1;
5803       char *sp_str = reg_names[STACK_POINTER_REGNUM];
5804       char *fp_str = reg_names[FRAME_POINTER_REGNUM];
5805       char *t1_str = "%g1";
5806
5807       /* In the reload sequence, we don't need to fill the load delay
5808          slots for most of the loads, also see if we can fill the final
5809          delay slot if not otherwise filled by the reload sequence.  */
5810
5811       if (size > 4095)
5812         fprintf (file, "\tset %d,%s\n", size, t1_str);
5813
5814       if (frame_pointer_needed)
5815         {
5816           if (size > 4095)
5817             fprintf (file,"\tsub %s,%s,%s\t\t%s# sp not trusted here\n",
5818                      fp_str, t1_str, sp_str, ASM_COMMENT_START);
5819           else
5820             fprintf (file,"\tsub %s,%d,%s\t\t%s# sp not trusted here\n",
5821                      fp_str, size, sp_str, ASM_COMMENT_START);
5822         }
5823
5824       /* Is the entire register save area offsettable from %sp?  */
5825       if (reg_offset < 4096 - 64 * UNITS_PER_WORD)
5826         {
5827           size1 = 0;
5828         }
5829       else
5830         {
5831           /* Restore %sp in two steps, but make sure there is always a
5832              64 byte register save area, and %sp is properly aligned.  */
5833           /* Amount to increment %sp by, the first time.  */
5834           size1 = ((reg_offset - 64 - 16) + 15) & -16;
5835           /* Offset to register save area from %sp.  */
5836           reg_offset = size1 - reg_offset;
5837
5838           fprintf (file, "\tset %d,%s\n\tadd %s,%s,%s\n",
5839                    size1, t1_str, sp_str, t1_str, sp_str);
5840         }
5841
5842       /* We must restore the frame pointer and return address reg first
5843          because they are treated specially by the prologue output code.  */
5844       if (current_frame_info.gmask & FRAME_POINTER_MASK)
5845         {
5846           fprintf (file, "\tld [%s+%d],%s\n",
5847                    sp_str, reg_offset, fp_str);
5848           reg_offset += 4;
5849         }
5850       if (current_frame_info.gmask & RETURN_ADDR_MASK)
5851         {
5852           fprintf (file, "\tld [%s+%d],%s\n",
5853                    sp_str, reg_offset, reg_names[RETURN_ADDR_REGNUM]);
5854           reg_offset += 4;
5855         }
5856
5857       /* Restore any remaining saved registers.  */
5858       sparc_flat_save_restore (file, sp_str, reg_offset,
5859                                current_frame_info.gmask & ~(FRAME_POINTER_MASK | RETURN_ADDR_MASK),
5860                                current_frame_info.fmask,
5861                                "ld", "ldd", 0);
5862
5863       /* If we had to increment %sp in two steps, record it so the second
5864          restoration in the epilogue finishes up.  */
5865       if (size1 > 0)
5866         {
5867           size -= size1;
5868           if (size > 4095)
5869             fprintf (file, "\tset %d,%s\n",
5870                      size, t1_str);
5871         }
5872
5873       if (current_function_returns_struct)
5874         fprintf (file, "\tjmp %%o7+12\n");
5875       else
5876         fprintf (file, "\tretl\n");
5877
5878       /* If the only register saved is the return address, we need a
5879          nop, unless we have an instruction to put into it.  Otherwise
5880          we don't since reloading multiple registers doesn't reference
5881          the register being loaded.  */
5882
5883       if (epilogue_delay)
5884         {
5885           if (size)
5886             abort ();
5887           final_scan_insn (XEXP (epilogue_delay, 0), file, 1, -2, 1);
5888         }
5889
5890       else if (size > 4095)
5891         fprintf (file, "\tadd %s,%s,%s\n", sp_str, t1_str, sp_str);
5892
5893       else if (size > 0)
5894         fprintf (file, "\tadd %s,%d,%s\n", sp_str, size, sp_str);
5895
5896       else
5897         fprintf (file, "\tnop\n");
5898     }
5899
5900   /* Reset state info for each function.  */
5901   current_frame_info = zero_frame_info;
5902 }
5903 \f
5904 /* Define the number of delay slots needed for the function epilogue.
5905
5906    On the sparc, we need a slot if either no stack has been allocated,
5907    or the only register saved is the return register.  */
5908
5909 int
5910 sparc_flat_epilogue_delay_slots ()
5911 {
5912   if (!current_frame_info.initialized)
5913     (void) sparc_flat_compute_frame_size (get_frame_size ());
5914
5915   if (current_frame_info.total_size == 0)
5916     return 1;
5917
5918   return 0;
5919 }
5920
5921 /* Return true is TRIAL is a valid insn for the epilogue delay slot.
5922    Any single length instruction which doesn't reference the stack or frame
5923    pointer is OK.  */
5924
5925 int
5926 sparc_flat_eligible_for_epilogue_delay (trial, slot)
5927      rtx trial;
5928      int slot;
5929 {
5930   rtx pat = PATTERN (trial);
5931
5932   if (get_attr_length (trial) != 1)
5933     return 0;
5934
5935   /* If %g0 is live, there are lots of things we can't handle.
5936      Rather than trying to find them all now, let's punt and only
5937      optimize things as necessary.  */
5938   if (TARGET_LIVE_G0)
5939     return 0;
5940
5941   if (! reg_mentioned_p (stack_pointer_rtx, pat)
5942       && ! reg_mentioned_p (frame_pointer_rtx, pat))
5943     return 1;
5944
5945   return 0;
5946 }
5947 \f
5948 /* Adjust the cost of a scheduling dependency.  Return the new cost of
5949    a dependency LINK or INSN on DEP_INSN.  COST is the current cost.  */
5950
5951 int
5952 supersparc_adjust_cost (insn, link, dep_insn, cost)
5953      rtx insn;
5954      rtx link;
5955      rtx dep_insn;
5956      int cost;
5957 {
5958   enum attr_type insn_type;
5959
5960   if (! recog_memoized (insn))
5961     return 0;
5962
5963   insn_type = get_attr_type (insn);
5964
5965   if (REG_NOTE_KIND (link) == 0)
5966     {
5967       /* Data dependency; DEP_INSN writes a register that INSN reads some
5968          cycles later.  */
5969
5970       /* if a load, then the dependence must be on the memory address;
5971          add an extra 'cycle'.  Note that the cost could be two cycles
5972          if the reg was written late in an instruction group; we can't tell
5973          here.  */
5974       if (insn_type == TYPE_LOAD || insn_type == TYPE_FPLOAD)
5975         return cost + 3;
5976
5977       /* Get the delay only if the address of the store is the dependence.  */
5978       if (insn_type == TYPE_STORE || insn_type == TYPE_FPSTORE)
5979         {
5980           rtx pat = PATTERN(insn);
5981           rtx dep_pat = PATTERN (dep_insn);
5982
5983           if (GET_CODE (pat) != SET || GET_CODE (dep_pat) != SET)
5984             return cost;  /* This shouldn't happen!  */
5985
5986           /* The dependency between the two instructions was on the data that
5987              is being stored.  Assume that this implies that the address of the
5988              store is not dependent.  */
5989           if (rtx_equal_p (SET_DEST (dep_pat), SET_SRC (pat)))
5990             return cost;
5991
5992           return cost + 3;  /* An approximation.  */
5993         }
5994
5995       /* A shift instruction cannot receive its data from an instruction
5996          in the same cycle; add a one cycle penalty.  */
5997       if (insn_type == TYPE_SHIFT)
5998         return cost + 3;   /* Split before cascade into shift.  */
5999     }
6000   else
6001     {
6002       /* Anti- or output- dependency; DEP_INSN reads/writes a register that
6003          INSN writes some cycles later.  */
6004
6005       /* These are only significant for the fpu unit; writing a fp reg before
6006          the fpu has finished with it stalls the processor.  */
6007
6008       /* Reusing an integer register causes no problems.  */
6009       if (insn_type == TYPE_IALU || insn_type == TYPE_SHIFT)
6010         return 0;
6011     }
6012
6013   return cost;
6014 }