gdbserver/linux-aarch64-low.cc

   1 /* GNU/Linux/AArch64 specific low level interface, for the remote server for
   2    GDB.
   3
   4    Copyright (C) 2009-2024 Free Software Foundation, Inc.
   5    Contributed by ARM Ltd.
   6
   7    This file is part of GDB.
   8
   9    This program is free software; you can redistribute it and/or modify
  10    it under the terms of the GNU General Public License as published by
  11    the Free Software Foundation; either version 3 of the License, or
  12    (at your option) any later version.
  13
  14    This program is distributed in the hope that it will be useful,
  15    but WITHOUT ANY WARRANTY; without even the implied warranty of
  16    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  17    GNU General Public License for more details.
  18
  19    You should have received a copy of the GNU General Public License
  20    along with this program.  If not, see <http://www.gnu.org/licenses/>.  */
  21
  22 #include "server.h"
  23 #include "linux-low.h"
  24 #include "nat/aarch64-linux.h"
  25 #include "nat/aarch64-linux-hw-point.h"
  26 #include "arch/aarch64-insn.h"
  27 #include "linux-aarch32-low.h"
  28 #include "elf/common.h"
  29 #include "ax.h"
  30 #include "tracepoint.h"
  31 #include "debug.h"
  32
  33 #include <signal.h>
  34 #include <sys/user.h>
  35 #include "nat/gdb_ptrace.h"
  36 #include <asm/ptrace.h>
  37 #include <inttypes.h>
  38 #include <endian.h>
  39 #include <sys/uio.h>
  40
  41 #include "gdb_proc_service.h"
  42 #include "arch/aarch64.h"
  43 #include "arch/aarch64-mte-linux.h"
  44 #include "arch/aarch64-scalable-linux.h"
  45 #include "linux-aarch32-tdesc.h"
  46 #include "linux-aarch64-tdesc.h"
  47 #include "nat/aarch64-mte-linux-ptrace.h"
  48 #include "nat/aarch64-scalable-linux-ptrace.h"
  49 #include "tdesc.h"
  50
  51 #ifdef HAVE_SYS_REG_H
  52 #include <sys/reg.h>
  53 #endif
  54
  55 #ifdef HAVE_GETAUXVAL
  56 #include <sys/auxv.h>
  57 #endif
  58
  59 /* Linux target op definitions for the AArch64 architecture.  */
  60
  61 class aarch64_target : public linux_process_target
  62 {
  63 public:
  64
  65   const regs_info *get_regs_info () override;
  66
  67   int breakpoint_kind_from_pc (CORE_ADDR *pcptr) override;
  68
  69   int breakpoint_kind_from_current_state (CORE_ADDR *pcptr) override;
  70
  71   const gdb_byte *sw_breakpoint_from_kind (int kind, int *size) override;
  72
  73   bool supports_z_point_type (char z_type) override;
  74
  75   bool supports_tracepoints () override;
  76
  77   bool supports_fast_tracepoints () override;
  78
  79   int install_fast_tracepoint_jump_pad
  80     (CORE_ADDR tpoint, CORE_ADDR tpaddr, CORE_ADDR collector,
  81      CORE_ADDR lockaddr, ULONGEST orig_size, CORE_ADDR *jump_entry,
  82      CORE_ADDR *trampoline, ULONGEST *trampoline_size,
  83      unsigned char *jjump_pad_insn, ULONGEST *jjump_pad_insn_size,
  84      CORE_ADDR *adjusted_insn_addr, CORE_ADDR *adjusted_insn_addr_end,
  85      char *err) override;
  86
  87   int get_min_fast_tracepoint_insn_len () override;
  88
  89   struct emit_ops *emit_ops () override;
  90
  91   bool supports_memory_tagging () override;
  92
  93   bool fetch_memtags (CORE_ADDR address, size_t len,
  94                       gdb::byte_vector &tags, int type) override;
  95
  96   bool store_memtags (CORE_ADDR address, size_t len,
  97                       const gdb::byte_vector &tags, int type) override;
  98
  99 protected:
 100
 101   void low_arch_setup () override;
 102
 103   bool low_cannot_fetch_register (int regno) override;
 104
 105   bool low_cannot_store_register (int regno) override;
 106
 107   bool low_supports_breakpoints () override;
 108
 109   CORE_ADDR low_get_pc (regcache *regcache) override;
 110
 111   void low_set_pc (regcache *regcache, CORE_ADDR newpc) override;
 112
 113   bool low_breakpoint_at (CORE_ADDR pc) override;
 114
 115   int low_insert_point (raw_bkpt_type type, CORE_ADDR addr,
 116                         int size, raw_breakpoint *bp) override;
 117
 118   int low_remove_point (raw_bkpt_type type, CORE_ADDR addr,
 119                         int size, raw_breakpoint *bp) override;
 120
 121   bool low_stopped_by_watchpoint () override;
 122
 123   CORE_ADDR low_stopped_data_address () override;
 124
 125   bool low_siginfo_fixup (siginfo_t *native, gdb_byte *inf,
 126                           int direction) override;
 127
 128   arch_process_info *low_new_process () override;
 129
 130   void low_delete_process (arch_process_info *info) override;
 131
 132   void low_new_thread (lwp_info *) override;
 133
 134   void low_delete_thread (arch_lwp_info *) override;
 135
 136   void low_new_fork (process_info *parent, process_info *child) override;
 137
 138   void low_prepare_to_resume (lwp_info *lwp) override;
 139
 140   int low_get_thread_area (int lwpid, CORE_ADDR *addrp) override;
 141
 142   bool low_supports_range_stepping () override;
 143
 144   bool low_supports_catch_syscall () override;
 145
 146   void low_get_syscall_trapinfo (regcache *regcache, int *sysno) override;
 147 };
 148
 149 /* The singleton target ops object.  */
 150
 151 static aarch64_target the_aarch64_target;
 152
 153 bool
 154 aarch64_target::low_cannot_fetch_register (int regno)
 155 {
 156   gdb_assert_not_reached ("linux target op low_cannot_fetch_register "
 157                           "is not implemented by the target");
 158 }
 159
 160 bool
 161 aarch64_target::low_cannot_store_register (int regno)
 162 {
 163   gdb_assert_not_reached ("linux target op low_cannot_store_register "
 164                           "is not implemented by the target");
 165 }
 166
 167 void
 168 aarch64_target::low_prepare_to_resume (lwp_info *lwp)
 169 {
 170   aarch64_linux_prepare_to_resume (lwp);
 171 }
 172
 173 /* Per-process arch-specific data we want to keep.  */
 174
 175 struct arch_process_info
 176 {
 177   /* Hardware breakpoint/watchpoint data.
 178      The reason for them to be per-process rather than per-thread is
 179      due to the lack of information in the gdbserver environment;
 180      gdbserver is not told that whether a requested hardware
 181      breakpoint/watchpoint is thread specific or not, so it has to set
 182      each hw bp/wp for every thread in the current process.  The
 183      higher level bp/wp management in gdb will resume a thread if a hw
 184      bp/wp trap is not expected for it.  Since the hw bp/wp setting is
 185      same for each thread, it is reasonable for the data to live here.
 186      */
 187   struct aarch64_debug_reg_state debug_reg_state;
 188 };
 189
 190 /* Return true if the size of register 0 is 8 byte.  */
 191
 192 static int
 193 is_64bit_tdesc (void)
 194 {
 195   /* We may not have a current thread at this point, so go straight to
 196      the process's target description.  */
 197   return register_size (current_process ()->tdesc, 0) == 8;
 198 }
 199
 200 static void
 201 aarch64_fill_gregset (struct regcache *regcache, void *buf)
 202 {
 203   struct user_pt_regs *regset = (struct user_pt_regs *) buf;
 204   int i;
 205
 206   for (i = 0; i < AARCH64_X_REGS_NUM; i++)
 207     collect_register (regcache, AARCH64_X0_REGNUM + i, &regset->regs[i]);
 208   collect_register (regcache, AARCH64_SP_REGNUM, &regset->sp);
 209   collect_register (regcache, AARCH64_PC_REGNUM, &regset->pc);
 210   collect_register (regcache, AARCH64_CPSR_REGNUM, &regset->pstate);
 211 }
 212
 213 static void
 214 aarch64_store_gregset (struct regcache *regcache, const void *buf)
 215 {
 216   const struct user_pt_regs *regset = (const struct user_pt_regs *) buf;
 217   int i;
 218
 219   for (i = 0; i < AARCH64_X_REGS_NUM; i++)
 220     supply_register (regcache, AARCH64_X0_REGNUM + i, &regset->regs[i]);
 221   supply_register (regcache, AARCH64_SP_REGNUM, &regset->sp);
 222   supply_register (regcache, AARCH64_PC_REGNUM, &regset->pc);
 223   supply_register (regcache, AARCH64_CPSR_REGNUM, &regset->pstate);
 224 }
 225
 226 static void
 227 aarch64_fill_fpregset (struct regcache *regcache, void *buf)
 228 {
 229   struct user_fpsimd_state *regset = (struct user_fpsimd_state *) buf;
 230   int i;
 231
 232   for (i = 0; i < AARCH64_V_REGS_NUM; i++)
 233     collect_register (regcache, AARCH64_V0_REGNUM + i, &regset->vregs[i]);
 234   collect_register (regcache, AARCH64_FPSR_REGNUM, &regset->fpsr);
 235   collect_register (regcache, AARCH64_FPCR_REGNUM, &regset->fpcr);
 236 }
 237
 238 static void
 239 aarch64_store_fpregset (struct regcache *regcache, const void *buf)
 240 {
 241   const struct user_fpsimd_state *regset
 242     = (const struct user_fpsimd_state *) buf;
 243   int i;
 244
 245   for (i = 0; i < AARCH64_V_REGS_NUM; i++)
 246     supply_register (regcache, AARCH64_V0_REGNUM + i, &regset->vregs[i]);
 247   supply_register (regcache, AARCH64_FPSR_REGNUM, &regset->fpsr);
 248   supply_register (regcache, AARCH64_FPCR_REGNUM, &regset->fpcr);
 249 }
 250
 251 /* Store the pauth registers to regcache.  */
 252
 253 static void
 254 aarch64_store_pauthregset (struct regcache *regcache, const void *buf)
 255 {
 256   uint64_t *pauth_regset = (uint64_t *) buf;
 257   int pauth_base = find_regno (regcache->tdesc, "pauth_dmask");
 258
 259   if (pauth_base == 0)
 260     return;
 261
 262   supply_register (regcache, AARCH64_PAUTH_DMASK_REGNUM (pauth_base),
 263                    &pauth_regset[0]);
 264   supply_register (regcache, AARCH64_PAUTH_CMASK_REGNUM (pauth_base),
 265                    &pauth_regset[1]);
 266 }
 267
 268 /* Fill BUF with the MTE registers from the regcache.  */
 269
 270 static void
 271 aarch64_fill_mteregset (struct regcache *regcache, void *buf)
 272 {
 273   uint64_t *mte_regset = (uint64_t *) buf;
 274   int mte_base = find_regno (regcache->tdesc, "tag_ctl");
 275
 276   collect_register (regcache, mte_base, mte_regset);
 277 }
 278
 279 /* Store the MTE registers to regcache.  */
 280
 281 static void
 282 aarch64_store_mteregset (struct regcache *regcache, const void *buf)
 283 {
 284   uint64_t *mte_regset = (uint64_t *) buf;
 285   int mte_base = find_regno (regcache->tdesc, "tag_ctl");
 286
 287   /* Tag Control register */
 288   supply_register (regcache, mte_base, mte_regset);
 289 }
 290
 291 /* Fill BUF with TLS register from the regcache.  */
 292
 293 static void
 294 aarch64_fill_tlsregset (struct regcache *regcache, void *buf)
 295 {
 296   gdb_byte *tls_buf = (gdb_byte *) buf;
 297   int tls_regnum  = find_regno (regcache->tdesc, "tpidr");
 298
 299   collect_register (regcache, tls_regnum, tls_buf);
 300
 301   /* Read TPIDR2, if it exists.  */
 302   std::optional<int> regnum = find_regno_no_throw (regcache->tdesc, "tpidr2");
 303
 304   if (regnum.has_value ())
 305     collect_register (regcache, *regnum, tls_buf + sizeof (uint64_t));
 306 }
 307
 308 /* Store TLS register to regcache.  */
 309
 310 static void
 311 aarch64_store_tlsregset (struct regcache *regcache, const void *buf)
 312 {
 313   gdb_byte *tls_buf = (gdb_byte *) buf;
 314   int tls_regnum  = find_regno (regcache->tdesc, "tpidr");
 315
 316   supply_register (regcache, tls_regnum, tls_buf);
 317
 318   /* Write TPIDR2, if it exists.  */
 319   std::optional<int> regnum = find_regno_no_throw (regcache->tdesc, "tpidr2");
 320
 321   if (regnum.has_value ())
 322     supply_register (regcache, *regnum, tls_buf + sizeof (uint64_t));
 323 }
 324
 325 bool
 326 aarch64_target::low_supports_breakpoints ()
 327 {
 328   return true;
 329 }
 330
 331 /* Implementation of linux target ops method "low_get_pc".  */
 332
 333 CORE_ADDR
 334 aarch64_target::low_get_pc (regcache *regcache)
 335 {
 336   if (register_size (regcache->tdesc, 0) == 8)
 337     return linux_get_pc_64bit (regcache);
 338   else
 339     return linux_get_pc_32bit (regcache);
 340 }
 341
 342 /* Implementation of linux target ops method "low_set_pc".  */
 343
 344 void
 345 aarch64_target::low_set_pc (regcache *regcache, CORE_ADDR pc)
 346 {
 347   if (register_size (regcache->tdesc, 0) == 8)
 348     linux_set_pc_64bit (regcache, pc);
 349   else
 350     linux_set_pc_32bit (regcache, pc);
 351 }
 352
 353 #define aarch64_breakpoint_len 4
 354
 355 /* AArch64 BRK software debug mode instruction.
 356    This instruction needs to match gdb/aarch64-tdep.c
 357    (aarch64_default_breakpoint).  */
 358 static const gdb_byte aarch64_breakpoint[] = {0x00, 0x00, 0x20, 0xd4};
 359
 360 /* Implementation of linux target ops method "low_breakpoint_at".  */
 361
 362 bool
 363 aarch64_target::low_breakpoint_at (CORE_ADDR where)
 364 {
 365   if (is_64bit_tdesc ())
 366     {
 367       gdb_byte insn[aarch64_breakpoint_len];
 368
 369       read_memory (where, (unsigned char *) &insn, aarch64_breakpoint_len);
 370       if (memcmp (insn, aarch64_breakpoint, aarch64_breakpoint_len) == 0)
 371         return true;
 372
 373       return false;
 374     }
 375   else
 376     return arm_breakpoint_at (where);
 377 }
 378
 379 static void
 380 aarch64_init_debug_reg_state (struct aarch64_debug_reg_state *state)
 381 {
 382   int i;
 383
 384   for (i = 0; i < AARCH64_HBP_MAX_NUM; ++i)
 385     {
 386       state->dr_addr_bp[i] = 0;
 387       state->dr_ctrl_bp[i] = 0;
 388       state->dr_ref_count_bp[i] = 0;
 389     }
 390
 391   for (i = 0; i < AARCH64_HWP_MAX_NUM; ++i)
 392     {
 393       state->dr_addr_wp[i] = 0;
 394       state->dr_ctrl_wp[i] = 0;
 395       state->dr_ref_count_wp[i] = 0;
 396     }
 397 }
 398
 399 /* Return the pointer to the debug register state structure in the
 400    current process' arch-specific data area.  */
 401
 402 struct aarch64_debug_reg_state *
 403 aarch64_get_debug_reg_state (pid_t pid)
 404 {
 405   struct process_info *proc = find_process_pid (pid);
 406
 407   return &proc->priv->arch_private->debug_reg_state;
 408 }
 409
 410 /* Implementation of target ops method "supports_z_point_type".  */
 411
 412 bool
 413 aarch64_target::supports_z_point_type (char z_type)
 414 {
 415   switch (z_type)
 416     {
 417     case Z_PACKET_SW_BP:
 418     case Z_PACKET_HW_BP:
 419     case Z_PACKET_WRITE_WP:
 420     case Z_PACKET_READ_WP:
 421     case Z_PACKET_ACCESS_WP:
 422       return true;
 423     default:
 424       return false;
 425     }
 426 }
 427
 428 /* Implementation of linux target ops method "low_insert_point".
 429
 430    It actually only records the info of the to-be-inserted bp/wp;
 431    the actual insertion will happen when threads are resumed.  */
 432
 433 int
 434 aarch64_target::low_insert_point (raw_bkpt_type type, CORE_ADDR addr,
 435                                   int len, raw_breakpoint *bp)
 436 {
 437   int ret;
 438   enum target_hw_bp_type targ_type;
 439   struct aarch64_debug_reg_state *state
 440     = aarch64_get_debug_reg_state (pid_of (current_thread));
 441
 442   if (show_debug_regs)
 443     fprintf (stderr, "insert_point on entry (addr=0x%08lx, len=%d)\n",
 444              (unsigned long) addr, len);
 445
 446   /* Determine the type from the raw breakpoint type.  */
 447   targ_type = raw_bkpt_type_to_target_hw_bp_type (type);
 448
 449   if (targ_type != hw_execute)
 450     {
 451       if (aarch64_region_ok_for_watchpoint (addr, len))
 452         ret = aarch64_handle_watchpoint (targ_type, addr, len,
 453                                          1 /* is_insert */,
 454                                          current_lwp_ptid (), state);
 455       else
 456         ret = -1;
 457     }
 458   else
 459     {
 460       if (len == 3)
 461         {
 462           /* LEN is 3 means the breakpoint is set on a 32-bit thumb
 463              instruction.   Set it to 2 to correctly encode length bit
 464              mask in hardware/watchpoint control register.  */
 465           len = 2;
 466         }
 467       ret = aarch64_handle_breakpoint (targ_type, addr, len,
 468                                        1 /* is_insert */, current_lwp_ptid (),
 469                                        state);
 470     }
 471
 472   if (show_debug_regs)
 473     aarch64_show_debug_reg_state (state, "insert_point", addr, len,
 474                                   targ_type);
 475
 476   return ret;
 477 }
 478
 479 /* Implementation of linux target ops method "low_remove_point".
 480
 481    It actually only records the info of the to-be-removed bp/wp,
 482    the actual removal will be done when threads are resumed.  */
 483
 484 int
 485 aarch64_target::low_remove_point (raw_bkpt_type type, CORE_ADDR addr,
 486                                   int len, raw_breakpoint *bp)
 487 {
 488   int ret;
 489   enum target_hw_bp_type targ_type;
 490   struct aarch64_debug_reg_state *state
 491     = aarch64_get_debug_reg_state (pid_of (current_thread));
 492
 493   if (show_debug_regs)
 494     fprintf (stderr, "remove_point on entry (addr=0x%08lx, len=%d)\n",
 495              (unsigned long) addr, len);
 496
 497   /* Determine the type from the raw breakpoint type.  */
 498   targ_type = raw_bkpt_type_to_target_hw_bp_type (type);
 499
 500   /* Set up state pointers.  */
 501   if (targ_type != hw_execute)
 502     ret =
 503       aarch64_handle_watchpoint (targ_type, addr, len, 0 /* is_insert */,
 504                                  current_lwp_ptid (), state);
 505   else
 506     {
 507       if (len == 3)
 508         {
 509           /* LEN is 3 means the breakpoint is set on a 32-bit thumb
 510              instruction.   Set it to 2 to correctly encode length bit
 511              mask in hardware/watchpoint control register.  */
 512           len = 2;
 513         }
 514       ret = aarch64_handle_breakpoint (targ_type, addr, len,
 515                                        0 /* is_insert */,  current_lwp_ptid (),
 516                                        state);
 517     }
 518
 519   if (show_debug_regs)
 520     aarch64_show_debug_reg_state (state, "remove_point", addr, len,
 521                                   targ_type);
 522
 523   return ret;
 524 }
 525
 526 static CORE_ADDR
 527 aarch64_remove_non_address_bits (CORE_ADDR pointer)
 528 {
 529   /* By default, we assume TBI and discard the top 8 bits plus the
 530      VA range select bit (55).  */
 531   CORE_ADDR mask = AARCH64_TOP_BITS_MASK;
 532
 533   /* Check if PAC is available for this target.  */
 534   if (tdesc_contains_feature (current_process ()->tdesc,
 535                               "org.gnu.gdb.aarch64.pauth"))
 536     {
 537       /* Fetch the PAC masks.  These masks are per-process, so we can just
 538          fetch data from whatever thread we have at the moment.
 539
 540          Also, we have both a code mask and a data mask.  For now they are the
 541          same, but this may change in the future.  */
 542
 543       struct regcache *regs = get_thread_regcache (current_thread, 1);
 544       CORE_ADDR dmask = regcache_raw_get_unsigned_by_name (regs, "pauth_dmask");
 545       CORE_ADDR cmask = regcache_raw_get_unsigned_by_name (regs, "pauth_cmask");
 546       mask |= aarch64_mask_from_pac_registers (cmask, dmask);
 547     }
 548
 549   return aarch64_remove_top_bits (pointer, mask);
 550 }
 551
 552 /* Implementation of linux target ops method "low_stopped_data_address".  */
 553
 554 CORE_ADDR
 555 aarch64_target::low_stopped_data_address ()
 556 {
 557   siginfo_t siginfo;
 558   int pid, i;
 559   struct aarch64_debug_reg_state *state;
 560
 561   pid = lwpid_of (current_thread);
 562
 563   /* Get the siginfo.  */
 564   if (ptrace (PTRACE_GETSIGINFO, pid, NULL, &siginfo) != 0)
 565     return (CORE_ADDR) 0;
 566
 567   /* Need to be a hardware breakpoint/watchpoint trap.  */
 568   if (siginfo.si_signo != SIGTRAP
 569       || (siginfo.si_code & 0xffff) != 0x0004 /* TRAP_HWBKPT */)
 570     return (CORE_ADDR) 0;
 571
 572   /* Make sure to ignore the top byte, otherwise we may not recognize a
 573      hardware watchpoint hit.  The stopped data addresses coming from the
 574      kernel can potentially be tagged addresses.  */
 575   const CORE_ADDR addr_trap
 576     = aarch64_remove_non_address_bits ((CORE_ADDR) siginfo.si_addr);
 577
 578   /* Check if the address matches any watched address.  */
 579   state = aarch64_get_debug_reg_state (pid_of (current_thread));
 580   for (i = aarch64_num_wp_regs - 1; i >= 0; --i)
 581     {
 582       const unsigned int offset
 583         = aarch64_watchpoint_offset (state->dr_ctrl_wp[i]);
 584       const unsigned int len = aarch64_watchpoint_length (state->dr_ctrl_wp[i]);
 585       const CORE_ADDR addr_watch = state->dr_addr_wp[i] + offset;
 586       const CORE_ADDR addr_watch_aligned = align_down (state->dr_addr_wp[i], 8);
 587       const CORE_ADDR addr_orig = state->dr_addr_orig_wp[i];
 588
 589       if (state->dr_ref_count_wp[i]
 590           && DR_CONTROL_ENABLED (state->dr_ctrl_wp[i])
 591           && addr_trap >= addr_watch_aligned
 592           && addr_trap < addr_watch + len)
 593         {
 594           /* ADDR_TRAP reports the first address of the memory range
 595              accessed by the CPU, regardless of what was the memory
 596              range watched.  Thus, a large CPU access that straddles
 597              the ADDR_WATCH..ADDR_WATCH+LEN range may result in an
 598              ADDR_TRAP that is lower than the
 599              ADDR_WATCH..ADDR_WATCH+LEN range.  E.g.:
 600
 601              addr: |   4   |   5   |   6   |   7   |   8   |
 602                                    |---- range watched ----|
 603                    |----------- range accessed ------------|
 604
 605              In this case, ADDR_TRAP will be 4.
 606
 607              To match a watchpoint known to GDB core, we must never
 608              report *ADDR_P outside of any ADDR_WATCH..ADDR_WATCH+LEN
 609              range.  ADDR_WATCH <= ADDR_TRAP < ADDR_ORIG is a false
 610              positive on kernels older than 4.10.  See PR
 611              external/20207.  */
 612           return addr_orig;
 613         }
 614     }
 615
 616   return (CORE_ADDR) 0;
 617 }
 618
 619 /* Implementation of linux target ops method "low_stopped_by_watchpoint".  */
 620
 621 bool
 622 aarch64_target::low_stopped_by_watchpoint ()
 623 {
 624   return (low_stopped_data_address () != 0);
 625 }
 626
 627 /* Fetch the thread-local storage pointer for libthread_db.  */
 628
 629 ps_err_e
 630 ps_get_thread_area (struct ps_prochandle *ph,
 631                     lwpid_t lwpid, int idx, void **base)
 632 {
 633   return aarch64_ps_get_thread_area (ph, lwpid, idx, base,
 634                                      is_64bit_tdesc ());
 635 }
 636
 637 /* Implementation of linux target ops method "low_siginfo_fixup".  */
 638
 639 bool
 640 aarch64_target::low_siginfo_fixup (siginfo_t *native, gdb_byte *inf,
 641                                    int direction)
 642 {
 643   /* Is the inferior 32-bit?  If so, then fixup the siginfo object.  */
 644   if (!is_64bit_tdesc ())
 645     {
 646       if (direction == 0)
 647         aarch64_compat_siginfo_from_siginfo ((struct compat_siginfo *) inf,
 648                                              native);
 649       else
 650         aarch64_siginfo_from_compat_siginfo (native,
 651                                              (struct compat_siginfo *) inf);
 652
 653       return true;
 654     }
 655
 656   return false;
 657 }
 658
 659 /* Implementation of linux target ops method "low_new_process".  */
 660
 661 arch_process_info *
 662 aarch64_target::low_new_process ()
 663 {
 664   struct arch_process_info *info = XCNEW (struct arch_process_info);
 665
 666   aarch64_init_debug_reg_state (&info->debug_reg_state);
 667
 668   return info;
 669 }
 670
 671 /* Implementation of linux target ops method "low_delete_process".  */
 672
 673 void
 674 aarch64_target::low_delete_process (arch_process_info *info)
 675 {
 676   xfree (info);
 677 }
 678
 679 void
 680 aarch64_target::low_new_thread (lwp_info *lwp)
 681 {
 682   aarch64_linux_new_thread (lwp);
 683 }
 684
 685 void
 686 aarch64_target::low_delete_thread (arch_lwp_info *arch_lwp)
 687 {
 688   aarch64_linux_delete_thread (arch_lwp);
 689 }
 690
 691 /* Implementation of linux target ops method "low_new_fork".  */
 692
 693 void
 694 aarch64_target::low_new_fork (process_info *parent,
 695                               process_info *child)
 696 {
 697   /* These are allocated by linux_add_process.  */
 698   gdb_assert (parent->priv != NULL
 699               && parent->priv->arch_private != NULL);
 700   gdb_assert (child->priv != NULL
 701               && child->priv->arch_private != NULL);
 702
 703   /* Linux kernel before 2.6.33 commit
 704      72f674d203cd230426437cdcf7dd6f681dad8b0d
 705      will inherit hardware debug registers from parent
 706      on fork/vfork/clone.  Newer Linux kernels create such tasks with
 707      zeroed debug registers.
 708
 709      GDB core assumes the child inherits the watchpoints/hw
 710      breakpoints of the parent, and will remove them all from the
 711      forked off process.  Copy the debug registers mirrors into the
 712      new process so that all breakpoints and watchpoints can be
 713      removed together.  The debug registers mirror will become zeroed
 714      in the end before detaching the forked off process, thus making
 715      this compatible with older Linux kernels too.  */
 716
 717   *child->priv->arch_private = *parent->priv->arch_private;
 718 }
 719
 720 /* Wrapper for aarch64_sve_regs_copy_to_reg_buf.  */
 721
 722 static void
 723 aarch64_sve_regs_copy_to_regcache (struct regcache *regcache,
 724                                    ATTRIBUTE_UNUSED const void *buf)
 725 {
 726   /* BUF is unused here since we collect the data straight from a ptrace
 727      request in aarch64_sve_regs_copy_to_reg_buf, therefore bypassing
 728      gdbserver's own call to ptrace.  */
 729
 730   int tid = lwpid_of (current_thread);
 731
 732   /* Update the register cache.  aarch64_sve_regs_copy_to_reg_buf handles
 733      fetching the NT_ARM_SVE state from thread TID.  */
 734   aarch64_sve_regs_copy_to_reg_buf (tid, regcache);
 735 }
 736
 737 /* Wrapper for aarch64_sve_regs_copy_from_reg_buf.  */
 738
 739 static void
 740 aarch64_sve_regs_copy_from_regcache (struct regcache *regcache, void *buf)
 741 {
 742   int tid = lwpid_of (current_thread);
 743
 744   /* Update the thread SVE state.  aarch64_sve_regs_copy_from_reg_buf
 745      handles writing the SVE/FPSIMD state back to thread TID.  */
 746   aarch64_sve_regs_copy_from_reg_buf (tid, regcache);
 747
 748   /* We need to return the expected data in BUF, so copy whatever the kernel
 749      already has to BUF.  */
 750   gdb::byte_vector sve_state = aarch64_fetch_sve_regset (tid);
 751   memcpy (buf, sve_state.data (), sve_state.size ());
 752 }
 753
 754 /* Wrapper for aarch64_za_regs_copy_to_reg_buf, to help copying NT_ARM_ZA
 755    state from the thread (BUF) to the register cache.  */
 756
 757 static void
 758 aarch64_za_regs_copy_to_regcache (struct regcache *regcache,
 759                                   ATTRIBUTE_UNUSED const void *buf)
 760 {
 761   /* BUF is unused here since we collect the data straight from a ptrace
 762      request, therefore bypassing gdbserver's own call to ptrace.  */
 763   int tid = lwpid_of (current_thread);
 764
 765   int za_regnum = find_regno (regcache->tdesc, "za");
 766   int svg_regnum = find_regno (regcache->tdesc, "svg");
 767   int svcr_regnum = find_regno (regcache->tdesc, "svcr");
 768
 769   /* Update the register cache.  aarch64_za_regs_copy_to_reg_buf handles
 770      fetching the NT_ARM_ZA state from thread TID.  */
 771   aarch64_za_regs_copy_to_reg_buf (tid, regcache, za_regnum, svg_regnum,
 772                                    svcr_regnum);
 773 }
 774
 775 /* Wrapper for aarch64_za_regs_copy_from_reg_buf, to help copying NT_ARM_ZA
 776    state from the register cache to the thread (BUF).  */
 777
 778 static void
 779 aarch64_za_regs_copy_from_regcache (struct regcache *regcache, void *buf)
 780 {
 781   int tid = lwpid_of (current_thread);
 782
 783   int za_regnum = find_regno (regcache->tdesc, "za");
 784   int svg_regnum = find_regno (regcache->tdesc, "svg");
 785   int svcr_regnum = find_regno (regcache->tdesc, "svcr");
 786
 787   /* Update the thread NT_ARM_ZA state.  aarch64_za_regs_copy_from_reg_buf
 788      handles writing the ZA state back to thread TID.  */
 789   aarch64_za_regs_copy_from_reg_buf (tid, regcache, za_regnum, svg_regnum,
 790                                      svcr_regnum);
 791
 792   /* We need to return the expected data in BUF, so copy whatever the kernel
 793      already has to BUF.  */
 794
 795   /* Obtain a dump of ZA from ptrace.  */
 796   gdb::byte_vector za_state = aarch64_fetch_za_regset (tid);
 797   memcpy (buf, za_state.data (), za_state.size ());
 798 }
 799
 800 /* Wrapper for aarch64_zt_regs_copy_to_reg_buf, to help copying NT_ARM_ZT
 801    state from the thread (BUF) to the register cache.  */
 802
 803 static void
 804 aarch64_zt_regs_copy_to_regcache (struct regcache *regcache,
 805                                   ATTRIBUTE_UNUSED const void *buf)
 806 {
 807   /* BUF is unused here since we collect the data straight from a ptrace
 808      request, therefore bypassing gdbserver's own call to ptrace.  */
 809   int tid = lwpid_of (current_thread);
 810
 811   int zt_regnum = find_regno (regcache->tdesc, "zt0");
 812
 813   /* Update the register cache.  aarch64_zt_regs_copy_to_reg_buf handles
 814      fetching the NT_ARM_ZT state from thread TID.  */
 815   aarch64_zt_regs_copy_to_reg_buf (tid, regcache, zt_regnum);
 816 }
 817
 818 /* Wrapper for aarch64_zt_regs_copy_from_reg_buf, to help copying NT_ARM_ZT
 819    state from the register cache to the thread (BUF).  */
 820
 821 static void
 822 aarch64_zt_regs_copy_from_regcache (struct regcache *regcache, void *buf)
 823 {
 824   int tid = lwpid_of (current_thread);
 825
 826   int zt_regnum = find_regno (regcache->tdesc, "zt0");
 827
 828   /* Update the thread NT_ARM_ZT state.  aarch64_zt_regs_copy_from_reg_buf
 829      handles writing the ZT state back to thread TID.  */
 830   aarch64_zt_regs_copy_from_reg_buf (tid, regcache, zt_regnum);
 831
 832   /* We need to return the expected data in BUF, so copy whatever the kernel
 833      already has to BUF.  */
 834
 835   /* Obtain a dump of NT_ARM_ZT from ptrace.  */
 836   gdb::byte_vector zt_state = aarch64_fetch_zt_regset (tid);
 837   memcpy (buf, zt_state.data (), zt_state.size ());
 838 }
 839
 840 /* Array containing all the possible register sets for AArch64/Linux.  During
 841    architecture setup, these will be checked against the HWCAP/HWCAP2 bits for
 842    validity and enabled/disabled accordingly.
 843
 844    Their sizes are set to 0 here, but they will be adjusted later depending
 845    on whether each register set is available or not.  */
 846 static struct regset_info aarch64_regsets[] =
 847 {
 848   /* GPR registers.  */
 849   { PTRACE_GETREGSET, PTRACE_SETREGSET, NT_PRSTATUS,
 850     0, GENERAL_REGS,
 851     aarch64_fill_gregset, aarch64_store_gregset },
 852   /* Floating Point (FPU) registers.  */
 853   { PTRACE_GETREGSET, PTRACE_SETREGSET, NT_FPREGSET,
 854     0, FP_REGS,
 855     aarch64_fill_fpregset, aarch64_store_fpregset
 856   },
 857   /* Scalable Vector Extension (SVE) registers.  */
 858   { PTRACE_GETREGSET, PTRACE_SETREGSET, NT_ARM_SVE,
 859     0, EXTENDED_REGS,
 860     aarch64_sve_regs_copy_from_regcache, aarch64_sve_regs_copy_to_regcache
 861   },
 862   /* Scalable Matrix Extension (SME) ZA register.  */
 863   { PTRACE_GETREGSET, PTRACE_SETREGSET, NT_ARM_ZA,
 864     0, EXTENDED_REGS,
 865     aarch64_za_regs_copy_from_regcache, aarch64_za_regs_copy_to_regcache
 866   },
 867   /* Scalable Matrix Extension 2 (SME2) ZT registers.  */
 868   { PTRACE_GETREGSET, PTRACE_SETREGSET, NT_ARM_ZT,
 869     0, EXTENDED_REGS,
 870     aarch64_zt_regs_copy_from_regcache, aarch64_zt_regs_copy_to_regcache
 871   },
 872   /* PAC registers.  */
 873   { PTRACE_GETREGSET, PTRACE_SETREGSET, NT_ARM_PAC_MASK,
 874     0, OPTIONAL_REGS,
 875     nullptr, aarch64_store_pauthregset },
 876   /* Tagged address control / MTE registers.  */
 877   { PTRACE_GETREGSET, PTRACE_SETREGSET, NT_ARM_TAGGED_ADDR_CTRL,
 878     0, OPTIONAL_REGS,
 879     aarch64_fill_mteregset, aarch64_store_mteregset },
 880   /* TLS register.  */
 881   { PTRACE_GETREGSET, PTRACE_SETREGSET, NT_ARM_TLS,
 882     0, OPTIONAL_REGS,
 883     aarch64_fill_tlsregset, aarch64_store_tlsregset },
 884   NULL_REGSET
 885 };
 886
 887 static struct regsets_info aarch64_regsets_info =
 888   {
 889     aarch64_regsets, /* regsets */
 890     0, /* num_regsets */
 891     nullptr, /* disabled_regsets */
 892   };
 893
 894 static struct regs_info regs_info_aarch64 =
 895   {
 896     nullptr, /* regset_bitmap */
 897     nullptr, /* usrregs */
 898     &aarch64_regsets_info,
 899   };
 900
 901 /* Given FEATURES, adjust the available register sets by setting their
 902    sizes.  A size of 0 means the register set is disabled and won't be
 903    used.  */
 904
 905 static void
 906 aarch64_adjust_register_sets (const struct aarch64_features &features)
 907 {
 908   struct regset_info *regset;
 909
 910   for (regset = aarch64_regsets; regset->size >= 0; regset++)
 911     {
 912       switch (regset->nt_type)
 913         {
 914         case NT_PRSTATUS:
 915           /* General purpose registers are always present.  */
 916           regset->size = sizeof (struct user_pt_regs);
 917           break;
 918         case NT_FPREGSET:
 919           /* This is unavailable when SVE is present.  */
 920           if (features.vq == 0)
 921             regset->size = sizeof (struct user_fpsimd_state);
 922           break;
 923         case NT_ARM_SVE:
 924           if (features.vq > 0)
 925             regset->size = SVE_PT_SIZE (AARCH64_MAX_SVE_VQ, SVE_PT_REGS_SVE);
 926           break;
 927         case NT_ARM_PAC_MASK:
 928           if (features.pauth)
 929             regset->size = AARCH64_PAUTH_REGS_SIZE;
 930           break;
 931         case NT_ARM_TAGGED_ADDR_CTRL:
 932           if (features.mte)
 933             regset->size = AARCH64_LINUX_SIZEOF_MTE;
 934           break;
 935         case NT_ARM_TLS:
 936           if (features.tls > 0)
 937             regset->size = AARCH64_TLS_REGISTER_SIZE * features.tls;
 938           break;
 939         case NT_ARM_ZA:
 940           if (features.svq > 0)
 941             regset->size = ZA_PT_SIZE (features.svq);
 942           break;
 943         case NT_ARM_ZT:
 944           if (features.sme2)
 945             regset->size = AARCH64_SME2_ZT0_SIZE;
 946           break;
 947         default:
 948           gdb_assert_not_reached ("Unknown register set found.");
 949         }
 950     }
 951 }
 952
 953 /* Matches HWCAP_PACA in kernel header arch/arm64/include/uapi/asm/hwcap.h.  */
 954 #define AARCH64_HWCAP_PACA (1 << 30)
 955
 956 /* Implementation of linux target ops method "low_arch_setup".  */
 957
 958 void
 959 aarch64_target::low_arch_setup ()
 960 {
 961   unsigned int machine;
 962   int is_elf64;
 963   int tid;
 964
 965   tid = lwpid_of (current_thread);
 966
 967   is_elf64 = linux_pid_exe_is_elf_64_file (tid, &machine);
 968
 969   if (is_elf64)
 970     {
 971       struct aarch64_features features;
 972       int pid = current_thread->id.pid ();
 973
 974       features.vq = aarch64_sve_get_vq (tid);
 975       /* A-profile PAC is 64-bit only.  */
 976       features.pauth = linux_get_hwcap (pid, 8) & AARCH64_HWCAP_PACA;
 977       /* A-profile MTE is 64-bit only.  */
 978       features.mte = linux_get_hwcap2 (pid, 8) & HWCAP2_MTE;
 979       features.tls = aarch64_tls_register_count (tid);
 980
 981       /* Scalable Matrix Extension feature and size check.  */
 982       if (linux_get_hwcap2 (pid, 8) & HWCAP2_SME)
 983         features.svq = aarch64_za_get_svq (tid);
 984
 985       /* Scalable Matrix Extension 2 feature check.  */
 986       CORE_ADDR hwcap2 = linux_get_hwcap2 (pid, 8);
 987       if ((hwcap2 & HWCAP2_SME2) || (hwcap2 & HWCAP2_SME2P1))
 988         {
 989           /* Make sure ptrace supports NT_ARM_ZT.  */
 990           features.sme2 = supports_zt_registers (tid);
 991         }
 992
 993       current_process ()->tdesc = aarch64_linux_read_description (features);
 994
 995       /* Adjust the register sets we should use for this particular set of
 996          features.  */
 997       aarch64_adjust_register_sets (features);
 998     }
 999   else
1000     current_process ()->tdesc = aarch32_linux_read_description ();
1001
1002   aarch64_linux_get_debug_reg_capacity (lwpid_of (current_thread));
1003 }
1004
1005 /* Implementation of linux target ops method "get_regs_info".  */
1006
1007 const regs_info *
1008 aarch64_target::get_regs_info ()
1009 {
1010   if (!is_64bit_tdesc ())
1011     return &regs_info_aarch32;
1012
1013   /* AArch64 64-bit registers.  */
1014   return &regs_info_aarch64;
1015 }
1016
1017 /* Implementation of target ops method "supports_tracepoints".  */
1018
1019 bool
1020 aarch64_target::supports_tracepoints ()
1021 {
1022   if (current_thread == NULL)
1023     return true;
1024   else
1025     {
1026       /* We don't support tracepoints on aarch32 now.  */
1027       return is_64bit_tdesc ();
1028     }
1029 }
1030
1031 /* Implementation of linux target ops method "low_get_thread_area".  */
1032
1033 int
1034 aarch64_target::low_get_thread_area (int lwpid, CORE_ADDR *addrp)
1035 {
1036   struct iovec iovec;
1037   uint64_t reg;
1038
1039   iovec.iov_base = &reg;
1040   iovec.iov_len = sizeof (reg);
1041
1042   if (ptrace (PTRACE_GETREGSET, lwpid, NT_ARM_TLS, &iovec) != 0)
1043     return -1;
1044
1045   *addrp = reg;
1046
1047   return 0;
1048 }
1049
1050 bool
1051 aarch64_target::low_supports_catch_syscall ()
1052 {
1053   return true;
1054 }
1055
1056 /* Implementation of linux target ops method "low_get_syscall_trapinfo".  */
1057
1058 void
1059 aarch64_target::low_get_syscall_trapinfo (regcache *regcache, int *sysno)
1060 {
1061   int use_64bit = register_size (regcache->tdesc, 0) == 8;
1062
1063   if (use_64bit)
1064     {
1065       long l_sysno;
1066
1067       collect_register_by_name (regcache, "x8", &l_sysno);
1068       *sysno = (int) l_sysno;
1069     }
1070   else
1071     collect_register_by_name (regcache, "r7", sysno);
1072 }
1073
1074 /* List of condition codes that we need.  */
1075
1076 enum aarch64_condition_codes
1077 {
1078   EQ = 0x0,
1079   NE = 0x1,
1080   LO = 0x3,
1081   GE = 0xa,
1082   LT = 0xb,
1083   GT = 0xc,
1084   LE = 0xd,
1085 };
1086
1087 enum aarch64_operand_type
1088 {
1089   OPERAND_IMMEDIATE,
1090   OPERAND_REGISTER,
1091 };
1092
1093 /* Representation of an operand.  At this time, it only supports register
1094    and immediate types.  */
1095
1096 struct aarch64_operand
1097 {
1098   /* Type of the operand.  */
1099   enum aarch64_operand_type type;
1100
1101   /* Value of the operand according to the type.  */
1102   union
1103     {
1104       uint32_t imm;
1105       struct aarch64_register reg;
1106     };
1107 };
1108
1109 /* List of registers that we are currently using, we can add more here as
1110    we need to use them.  */
1111
1112 /* General purpose scratch registers (64 bit).  */
1113 static const struct aarch64_register x0 = { 0, 1 };
1114 static const struct aarch64_register x1 = { 1, 1 };
1115 static const struct aarch64_register x2 = { 2, 1 };
1116 static const struct aarch64_register x3 = { 3, 1 };
1117 static const struct aarch64_register x4 = { 4, 1 };
1118
1119 /* General purpose scratch registers (32 bit).  */
1120 static const struct aarch64_register w0 = { 0, 0 };
1121 static const struct aarch64_register w2 = { 2, 0 };
1122
1123 /* Intra-procedure scratch registers.  */
1124 static const struct aarch64_register ip0 = { 16, 1 };
1125
1126 /* Special purpose registers.  */
1127 static const struct aarch64_register fp = { 29, 1 };
1128 static const struct aarch64_register lr = { 30, 1 };
1129 static const struct aarch64_register sp = { 31, 1 };
1130 static const struct aarch64_register xzr = { 31, 1 };
1131
1132 /* Dynamically allocate a new register.  If we know the register
1133    statically, we should make it a global as above instead of using this
1134    helper function.  */
1135
1136 static struct aarch64_register
1137 aarch64_register (unsigned num, int is64)
1138 {
1139   return (struct aarch64_register) { num, is64 };
1140 }
1141
1142 /* Helper function to create a register operand, for instructions with
1143    different types of operands.
1144
1145    For example:
1146    p += emit_mov (p, x0, register_operand (x1));  */
1147
1148 static struct aarch64_operand
1149 register_operand (struct aarch64_register reg)
1150 {
1151   struct aarch64_operand operand;
1152
1153   operand.type = OPERAND_REGISTER;
1154   operand.reg = reg;
1155
1156   return operand;
1157 }
1158
1159 /* Helper function to create an immediate operand, for instructions with
1160    different types of operands.
1161
1162    For example:
1163    p += emit_mov (p, x0, immediate_operand (12));  */
1164
1165 static struct aarch64_operand
1166 immediate_operand (uint32_t imm)
1167 {
1168   struct aarch64_operand operand;
1169
1170   operand.type = OPERAND_IMMEDIATE;
1171   operand.imm = imm;
1172
1173   return operand;
1174 }
1175
1176 /* Helper function to create an offset memory operand.
1177
1178    For example:
1179    p += emit_ldr (p, x0, sp, offset_memory_operand (16));  */
1180
1181 static struct aarch64_memory_operand
1182 offset_memory_operand (int32_t offset)
1183 {
1184   return (struct aarch64_memory_operand) { MEMORY_OPERAND_OFFSET, offset };
1185 }
1186
1187 /* Helper function to create a pre-index memory operand.
1188
1189    For example:
1190    p += emit_ldr (p, x0, sp, preindex_memory_operand (16));  */
1191
1192 static struct aarch64_memory_operand
1193 preindex_memory_operand (int32_t index)
1194 {
1195   return (struct aarch64_memory_operand) { MEMORY_OPERAND_PREINDEX, index };
1196 }
1197
1198 /* Helper function to create a post-index memory operand.
1199
1200    For example:
1201    p += emit_ldr (p, x0, sp, postindex_memory_operand (16));  */
1202
1203 static struct aarch64_memory_operand
1204 postindex_memory_operand (int32_t index)
1205 {
1206   return (struct aarch64_memory_operand) { MEMORY_OPERAND_POSTINDEX, index };
1207 }
1208
1209 /* System control registers.  These special registers can be written and
1210    read with the MRS and MSR instructions.
1211
1212    - NZCV: Condition flags.  GDB refers to this register under the CPSR
1213            name.
1214    - FPSR: Floating-point status register.
1215    - FPCR: Floating-point control registers.
1216    - TPIDR_EL0: Software thread ID register.  */
1217
1218 enum aarch64_system_control_registers
1219 {
1220   /*          op0           op1           crn          crm          op2  */
1221   NZCV =      (0x1 << 14) | (0x3 << 11) | (0x4 << 7) | (0x2 << 3) | 0x0,
1222   FPSR =      (0x1 << 14) | (0x3 << 11) | (0x4 << 7) | (0x4 << 3) | 0x1,
1223   FPCR =      (0x1 << 14) | (0x3 << 11) | (0x4 << 7) | (0x4 << 3) | 0x0,
1224   TPIDR_EL0 = (0x1 << 14) | (0x3 << 11) | (0xd << 7) | (0x0 << 3) | 0x2
1225 };
1226
1227 /* Write a BLR instruction into *BUF.
1228
1229      BLR rn
1230
1231    RN is the register to branch to.  */
1232
1233 static int
1234 emit_blr (uint32_t *buf, struct aarch64_register rn)
1235 {
1236   return aarch64_emit_insn (buf, BLR | ENCODE (rn.num, 5, 5));
1237 }
1238
1239 /* Write a RET instruction into *BUF.
1240
1241      RET xn
1242
1243    RN is the register to branch to.  */
1244
1245 static int
1246 emit_ret (uint32_t *buf, struct aarch64_register rn)
1247 {
1248   return aarch64_emit_insn (buf, RET | ENCODE (rn.num, 5, 5));
1249 }
1250
1251 static int
1252 emit_load_store_pair (uint32_t *buf, enum aarch64_opcodes opcode,
1253                       struct aarch64_register rt,
1254                       struct aarch64_register rt2,
1255                       struct aarch64_register rn,
1256                       struct aarch64_memory_operand operand)
1257 {
1258   uint32_t opc;
1259   uint32_t pre_index;
1260   uint32_t write_back;
1261
1262   if (rt.is64)
1263     opc = ENCODE (2, 2, 30);
1264   else
1265     opc = ENCODE (0, 2, 30);
1266
1267   switch (operand.type)
1268     {
1269     case MEMORY_OPERAND_OFFSET:
1270       {
1271         pre_index = ENCODE (1, 1, 24);
1272         write_back = ENCODE (0, 1, 23);
1273         break;
1274       }
1275     case MEMORY_OPERAND_POSTINDEX:
1276       {
1277         pre_index = ENCODE (0, 1, 24);
1278         write_back = ENCODE (1, 1, 23);
1279         break;
1280       }
1281     case MEMORY_OPERAND_PREINDEX:
1282       {
1283         pre_index = ENCODE (1, 1, 24);
1284         write_back = ENCODE (1, 1, 23);
1285         break;
1286       }
1287     default:
1288       return 0;
1289     }
1290
1291   return aarch64_emit_insn (buf, opcode | opc | pre_index | write_back
1292                             | ENCODE (operand.index >> 3, 7, 15)
1293                             | ENCODE (rt2.num, 5, 10)
1294                             | ENCODE (rn.num, 5, 5) | ENCODE (rt.num, 5, 0));
1295 }
1296
1297 /* Write a STP instruction into *BUF.
1298
1299      STP rt, rt2, [rn, #offset]
1300      STP rt, rt2, [rn, #index]!
1301      STP rt, rt2, [rn], #index
1302
1303    RT and RT2 are the registers to store.
1304    RN is the base address register.
1305    OFFSET is the immediate to add to the base address.  It is limited to a
1306    -512 .. 504 range (7 bits << 3).  */
1307
1308 static int
1309 emit_stp (uint32_t *buf, struct aarch64_register rt,
1310           struct aarch64_register rt2, struct aarch64_register rn,
1311           struct aarch64_memory_operand operand)
1312 {
1313   return emit_load_store_pair (buf, STP, rt, rt2, rn, operand);
1314 }
1315
1316 /* Write a LDP instruction into *BUF.
1317
1318      LDP rt, rt2, [rn, #offset]
1319      LDP rt, rt2, [rn, #index]!
1320      LDP rt, rt2, [rn], #index
1321
1322    RT and RT2 are the registers to store.
1323    RN is the base address register.
1324    OFFSET is the immediate to add to the base address.  It is limited to a
1325    -512 .. 504 range (7 bits << 3).  */
1326
1327 static int
1328 emit_ldp (uint32_t *buf, struct aarch64_register rt,
1329           struct aarch64_register rt2, struct aarch64_register rn,
1330           struct aarch64_memory_operand operand)
1331 {
1332   return emit_load_store_pair (buf, LDP, rt, rt2, rn, operand);
1333 }
1334
1335 /* Write a LDP (SIMD&VFP) instruction using Q registers into *BUF.
1336
1337      LDP qt, qt2, [rn, #offset]
1338
1339    RT and RT2 are the Q registers to store.
1340    RN is the base address register.
1341    OFFSET is the immediate to add to the base address.  It is limited to
1342    -1024 .. 1008 range (7 bits << 4).  */
1343
1344 static int
1345 emit_ldp_q_offset (uint32_t *buf, unsigned rt, unsigned rt2,
1346                    struct aarch64_register rn, int32_t offset)
1347 {
1348   uint32_t opc = ENCODE (2, 2, 30);
1349   uint32_t pre_index = ENCODE (1, 1, 24);
1350
1351   return aarch64_emit_insn (buf, LDP_SIMD_VFP | opc | pre_index
1352                             | ENCODE (offset >> 4, 7, 15)
1353                             | ENCODE (rt2, 5, 10)
1354                             | ENCODE (rn.num, 5, 5) | ENCODE (rt, 5, 0));
1355 }
1356
1357 /* Write a STP (SIMD&VFP) instruction using Q registers into *BUF.
1358
1359      STP qt, qt2, [rn, #offset]
1360
1361    RT and RT2 are the Q registers to store.
1362    RN is the base address register.
1363    OFFSET is the immediate to add to the base address.  It is limited to
1364    -1024 .. 1008 range (7 bits << 4).  */
1365
1366 static int
1367 emit_stp_q_offset (uint32_t *buf, unsigned rt, unsigned rt2,
1368                    struct aarch64_register rn, int32_t offset)
1369 {
1370   uint32_t opc = ENCODE (2, 2, 30);
1371   uint32_t pre_index = ENCODE (1, 1, 24);
1372
1373   return aarch64_emit_insn (buf, STP_SIMD_VFP | opc | pre_index
1374                             | ENCODE (offset >> 4, 7, 15)
1375                             | ENCODE (rt2, 5, 10)
1376                             | ENCODE (rn.num, 5, 5) | ENCODE (rt, 5, 0));
1377 }
1378
1379 /* Write a LDRH instruction into *BUF.
1380
1381      LDRH wt, [xn, #offset]
1382      LDRH wt, [xn, #index]!
1383      LDRH wt, [xn], #index
1384
1385    RT is the register to store.
1386    RN is the base address register.
1387    OFFSET is the immediate to add to the base address.  It is limited to
1388    0 .. 32760 range (12 bits << 3).  */
1389
1390 static int
1391 emit_ldrh (uint32_t *buf, struct aarch64_register rt,
1392            struct aarch64_register rn,
1393            struct aarch64_memory_operand operand)
1394 {
1395   return aarch64_emit_load_store (buf, 1, LDR, rt, rn, operand);
1396 }
1397
1398 /* Write a LDRB instruction into *BUF.
1399
1400      LDRB wt, [xn, #offset]
1401      LDRB wt, [xn, #index]!
1402      LDRB wt, [xn], #index
1403
1404    RT is the register to store.
1405    RN is the base address register.
1406    OFFSET is the immediate to add to the base address.  It is limited to
1407    0 .. 32760 range (12 bits << 3).  */
1408
1409 static int
1410 emit_ldrb (uint32_t *buf, struct aarch64_register rt,
1411            struct aarch64_register rn,
1412            struct aarch64_memory_operand operand)
1413 {
1414   return aarch64_emit_load_store (buf, 0, LDR, rt, rn, operand);
1415 }
1416
1417
1418
1419 /* Write a STR instruction into *BUF.
1420
1421      STR rt, [rn, #offset]
1422      STR rt, [rn, #index]!
1423      STR rt, [rn], #index
1424
1425    RT is the register to store.
1426    RN is the base address register.
1427    OFFSET is the immediate to add to the base address.  It is limited to
1428    0 .. 32760 range (12 bits << 3).  */
1429
1430 static int
1431 emit_str (uint32_t *buf, struct aarch64_register rt,
1432           struct aarch64_register rn,
1433           struct aarch64_memory_operand operand)
1434 {
1435   return aarch64_emit_load_store (buf, rt.is64 ? 3 : 2, STR, rt, rn, operand);
1436 }
1437
1438 /* Helper function emitting an exclusive load or store instruction.  */
1439
1440 static int
1441 emit_load_store_exclusive (uint32_t *buf, uint32_t size,
1442                            enum aarch64_opcodes opcode,
1443                            struct aarch64_register rs,
1444                            struct aarch64_register rt,
1445                            struct aarch64_register rt2,
1446                            struct aarch64_register rn)
1447 {
1448   return aarch64_emit_insn (buf, opcode | ENCODE (size, 2, 30)
1449                             | ENCODE (rs.num, 5, 16) | ENCODE (rt2.num, 5, 10)
1450                             | ENCODE (rn.num, 5, 5) | ENCODE (rt.num, 5, 0));
1451 }
1452
1453 /* Write a LAXR instruction into *BUF.
1454
1455      LDAXR rt, [xn]
1456
1457    RT is the destination register.
1458    RN is the base address register.  */
1459
1460 static int
1461 emit_ldaxr (uint32_t *buf, struct aarch64_register rt,
1462             struct aarch64_register rn)
1463 {
1464   return emit_load_store_exclusive (buf, rt.is64 ? 3 : 2, LDAXR, xzr, rt,
1465                                     xzr, rn);
1466 }
1467
1468 /* Write a STXR instruction into *BUF.
1469
1470      STXR ws, rt, [xn]
1471
1472    RS is the result register, it indicates if the store succeeded or not.
1473    RT is the destination register.
1474    RN is the base address register.  */
1475
1476 static int
1477 emit_stxr (uint32_t *buf, struct aarch64_register rs,
1478            struct aarch64_register rt, struct aarch64_register rn)
1479 {
1480   return emit_load_store_exclusive (buf, rt.is64 ? 3 : 2, STXR, rs, rt,
1481                                     xzr, rn);
1482 }
1483
1484 /* Write a STLR instruction into *BUF.
1485
1486      STLR rt, [xn]
1487
1488    RT is the register to store.
1489    RN is the base address register.  */
1490
1491 static int
1492 emit_stlr (uint32_t *buf, struct aarch64_register rt,
1493            struct aarch64_register rn)
1494 {
1495   return emit_load_store_exclusive (buf, rt.is64 ? 3 : 2, STLR, xzr, rt,
1496                                     xzr, rn);
1497 }
1498
1499 /* Helper function for data processing instructions with register sources.  */
1500
1501 static int
1502 emit_data_processing_reg (uint32_t *buf, uint32_t opcode,
1503                           struct aarch64_register rd,
1504                           struct aarch64_register rn,
1505                           struct aarch64_register rm)
1506 {
1507   uint32_t size = ENCODE (rd.is64, 1, 31);
1508
1509   return aarch64_emit_insn (buf, opcode | size | ENCODE (rm.num, 5, 16)
1510                             | ENCODE (rn.num, 5, 5) | ENCODE (rd.num, 5, 0));
1511 }
1512
1513 /* Helper function for data processing instructions taking either a register
1514    or an immediate.  */
1515
1516 static int
1517 emit_data_processing (uint32_t *buf, enum aarch64_opcodes opcode,
1518                       struct aarch64_register rd,
1519                       struct aarch64_register rn,
1520                       struct aarch64_operand operand)
1521 {
1522   uint32_t size = ENCODE (rd.is64, 1, 31);
1523   /* The opcode is different for register and immediate source operands.  */
1524   uint32_t operand_opcode;
1525
1526   if (operand.type == OPERAND_IMMEDIATE)
1527     {
1528       /* xxx1 000x xxxx xxxx xxxx xxxx xxxx xxxx */
1529       operand_opcode = ENCODE (8, 4, 25);
1530
1531       return aarch64_emit_insn (buf, opcode | operand_opcode | size
1532                                 | ENCODE (operand.imm, 12, 10)
1533                                 | ENCODE (rn.num, 5, 5)
1534                                 | ENCODE (rd.num, 5, 0));
1535     }
1536   else
1537     {
1538       /* xxx0 101x xxxx xxxx xxxx xxxx xxxx xxxx */
1539       operand_opcode = ENCODE (5, 4, 25);
1540
1541       return emit_data_processing_reg (buf, opcode | operand_opcode, rd,
1542                                        rn, operand.reg);
1543     }
1544 }
1545
1546 /* Write an ADD instruction into *BUF.
1547
1548      ADD rd, rn, #imm
1549      ADD rd, rn, rm
1550
1551    This function handles both an immediate and register add.
1552
1553    RD is the destination register.
1554    RN is the input register.
1555    OPERAND is the source operand, either of type OPERAND_IMMEDIATE or
1556    OPERAND_REGISTER.  */
1557
1558 static int
1559 emit_add (uint32_t *buf, struct aarch64_register rd,
1560           struct aarch64_register rn, struct aarch64_operand operand)
1561 {
1562   return emit_data_processing (buf, ADD, rd, rn, operand);
1563 }
1564
1565 /* Write a SUB instruction into *BUF.
1566
1567      SUB rd, rn, #imm
1568      SUB rd, rn, rm
1569
1570    This function handles both an immediate and register sub.
1571
1572    RD is the destination register.
1573    RN is the input register.
1574    IMM is the immediate to substract to RN.  */
1575
1576 static int
1577 emit_sub (uint32_t *buf, struct aarch64_register rd,
1578           struct aarch64_register rn, struct aarch64_operand operand)
1579 {
1580   return emit_data_processing (buf, SUB, rd, rn, operand);
1581 }
1582
1583 /* Write a MOV instruction into *BUF.
1584
1585      MOV rd, #imm
1586      MOV rd, rm
1587
1588    This function handles both a wide immediate move and a register move,
1589    with the condition that the source register is not xzr.  xzr and the
1590    stack pointer share the same encoding and this function only supports
1591    the stack pointer.
1592
1593    RD is the destination register.
1594    OPERAND is the source operand, either of type OPERAND_IMMEDIATE or
1595    OPERAND_REGISTER.  */
1596
1597 static int
1598 emit_mov (uint32_t *buf, struct aarch64_register rd,
1599           struct aarch64_operand operand)
1600 {
1601   if (operand.type == OPERAND_IMMEDIATE)
1602     {
1603       uint32_t size = ENCODE (rd.is64, 1, 31);
1604       /* Do not shift the immediate.  */
1605       uint32_t shift = ENCODE (0, 2, 21);
1606
1607       return aarch64_emit_insn (buf, MOV | size | shift
1608                                 | ENCODE (operand.imm, 16, 5)
1609                                 | ENCODE (rd.num, 5, 0));
1610     }
1611   else
1612     return emit_add (buf, rd, operand.reg, immediate_operand (0));
1613 }
1614
1615 /* Write a MOVK instruction into *BUF.
1616
1617      MOVK rd, #imm, lsl #shift
1618
1619    RD is the destination register.
1620    IMM is the immediate.
1621    SHIFT is the logical shift left to apply to IMM.   */
1622
1623 static int
1624 emit_movk (uint32_t *buf, struct aarch64_register rd, uint32_t imm,
1625            unsigned shift)
1626 {
1627   uint32_t size = ENCODE (rd.is64, 1, 31);
1628
1629   return aarch64_emit_insn (buf, MOVK | size | ENCODE (shift, 2, 21) |
1630                             ENCODE (imm, 16, 5) | ENCODE (rd.num, 5, 0));
1631 }
1632
1633 /* Write instructions into *BUF in order to move ADDR into a register.
1634    ADDR can be a 64-bit value.
1635
1636    This function will emit a series of MOV and MOVK instructions, such as:
1637
1638      MOV  xd, #(addr)
1639      MOVK xd, #(addr >> 16), lsl #16
1640      MOVK xd, #(addr >> 32), lsl #32
1641      MOVK xd, #(addr >> 48), lsl #48  */
1642
1643 static int
1644 emit_mov_addr (uint32_t *buf, struct aarch64_register rd, CORE_ADDR addr)
1645 {
1646   uint32_t *p = buf;
1647
1648   /* The MOV (wide immediate) instruction clears to top bits of the
1649      register.  */
1650   p += emit_mov (p, rd, immediate_operand (addr & 0xffff));
1651
1652   if ((addr >> 16) != 0)
1653     p += emit_movk (p, rd, (addr >> 16) & 0xffff, 1);
1654   else
1655     return p - buf;
1656
1657   if ((addr >> 32) != 0)
1658     p += emit_movk (p, rd, (addr >> 32) & 0xffff, 2);
1659   else
1660     return p - buf;
1661
1662   if ((addr >> 48) != 0)
1663     p += emit_movk (p, rd, (addr >> 48) & 0xffff, 3);
1664
1665   return p - buf;
1666 }
1667
1668 /* Write a SUBS instruction into *BUF.
1669
1670      SUBS rd, rn, rm
1671
1672    This instruction update the condition flags.
1673
1674    RD is the destination register.
1675    RN and RM are the source registers.  */
1676
1677 static int
1678 emit_subs (uint32_t *buf, struct aarch64_register rd,
1679            struct aarch64_register rn, struct aarch64_operand operand)
1680 {
1681   return emit_data_processing (buf, SUBS, rd, rn, operand);
1682 }
1683
1684 /* Write a CMP instruction into *BUF.
1685
1686      CMP rn, rm
1687
1688    This instruction is an alias of SUBS xzr, rn, rm.
1689
1690    RN and RM are the registers to compare.  */
1691
1692 static int
1693 emit_cmp (uint32_t *buf, struct aarch64_register rn,
1694               struct aarch64_operand operand)
1695 {
1696   return emit_subs (buf, xzr, rn, operand);
1697 }
1698
1699 /* Write a AND instruction into *BUF.
1700
1701      AND rd, rn, rm
1702
1703    RD is the destination register.
1704    RN and RM are the source registers.  */
1705
1706 static int
1707 emit_and (uint32_t *buf, struct aarch64_register rd,
1708           struct aarch64_register rn, struct aarch64_register rm)
1709 {
1710   return emit_data_processing_reg (buf, AND, rd, rn, rm);
1711 }
1712
1713 /* Write a ORR instruction into *BUF.
1714
1715      ORR rd, rn, rm
1716
1717    RD is the destination register.
1718    RN and RM are the source registers.  */
1719
1720 static int
1721 emit_orr (uint32_t *buf, struct aarch64_register rd,
1722           struct aarch64_register rn, struct aarch64_register rm)
1723 {
1724   return emit_data_processing_reg (buf, ORR, rd, rn, rm);
1725 }
1726
1727 /* Write a ORN instruction into *BUF.
1728
1729      ORN rd, rn, rm
1730
1731    RD is the destination register.
1732    RN and RM are the source registers.  */
1733
1734 static int
1735 emit_orn (uint32_t *buf, struct aarch64_register rd,
1736           struct aarch64_register rn, struct aarch64_register rm)
1737 {
1738   return emit_data_processing_reg (buf, ORN, rd, rn, rm);
1739 }
1740
1741 /* Write a EOR instruction into *BUF.
1742
1743      EOR rd, rn, rm
1744
1745    RD is the destination register.
1746    RN and RM are the source registers.  */
1747
1748 static int
1749 emit_eor (uint32_t *buf, struct aarch64_register rd,
1750           struct aarch64_register rn, struct aarch64_register rm)
1751 {
1752   return emit_data_processing_reg (buf, EOR, rd, rn, rm);
1753 }
1754
1755 /* Write a MVN instruction into *BUF.
1756
1757      MVN rd, rm
1758
1759    This is an alias for ORN rd, xzr, rm.
1760
1761    RD is the destination register.
1762    RM is the source register.  */
1763
1764 static int
1765 emit_mvn (uint32_t *buf, struct aarch64_register rd,
1766           struct aarch64_register rm)
1767 {
1768   return emit_orn (buf, rd, xzr, rm);
1769 }
1770
1771 /* Write a LSLV instruction into *BUF.
1772
1773      LSLV rd, rn, rm
1774
1775    RD is the destination register.
1776    RN and RM are the source registers.  */
1777
1778 static int
1779 emit_lslv (uint32_t *buf, struct aarch64_register rd,
1780            struct aarch64_register rn, struct aarch64_register rm)
1781 {
1782   return emit_data_processing_reg (buf, LSLV, rd, rn, rm);
1783 }
1784
1785 /* Write a LSRV instruction into *BUF.
1786
1787      LSRV rd, rn, rm
1788
1789    RD is the destination register.
1790    RN and RM are the source registers.  */
1791
1792 static int
1793 emit_lsrv (uint32_t *buf, struct aarch64_register rd,
1794            struct aarch64_register rn, struct aarch64_register rm)
1795 {
1796   return emit_data_processing_reg (buf, LSRV, rd, rn, rm);
1797 }
1798
1799 /* Write a ASRV instruction into *BUF.
1800
1801      ASRV rd, rn, rm
1802
1803    RD is the destination register.
1804    RN and RM are the source registers.  */
1805
1806 static int
1807 emit_asrv (uint32_t *buf, struct aarch64_register rd,
1808            struct aarch64_register rn, struct aarch64_register rm)
1809 {
1810   return emit_data_processing_reg (buf, ASRV, rd, rn, rm);
1811 }
1812
1813 /* Write a MUL instruction into *BUF.
1814
1815      MUL rd, rn, rm
1816
1817    RD is the destination register.
1818    RN and RM are the source registers.  */
1819
1820 static int
1821 emit_mul (uint32_t *buf, struct aarch64_register rd,
1822           struct aarch64_register rn, struct aarch64_register rm)
1823 {
1824   return emit_data_processing_reg (buf, MUL, rd, rn, rm);
1825 }
1826
1827 /* Write a MRS instruction into *BUF.  The register size is 64-bit.
1828
1829      MRS xt, system_reg
1830
1831    RT is the destination register.
1832    SYSTEM_REG is special purpose register to read.  */
1833
1834 static int
1835 emit_mrs (uint32_t *buf, struct aarch64_register rt,
1836           enum aarch64_system_control_registers system_reg)
1837 {
1838   return aarch64_emit_insn (buf, MRS | ENCODE (system_reg, 15, 5)
1839                             | ENCODE (rt.num, 5, 0));
1840 }
1841
1842 /* Write a MSR instruction into *BUF.  The register size is 64-bit.
1843
1844      MSR system_reg, xt
1845
1846    SYSTEM_REG is special purpose register to write.
1847    RT is the input register.  */
1848
1849 static int
1850 emit_msr (uint32_t *buf, enum aarch64_system_control_registers system_reg,
1851           struct aarch64_register rt)
1852 {
1853   return aarch64_emit_insn (buf, MSR | ENCODE (system_reg, 15, 5)
1854                             | ENCODE (rt.num, 5, 0));
1855 }
1856
1857 /* Write a SEVL instruction into *BUF.
1858
1859    This is a hint instruction telling the hardware to trigger an event.  */
1860
1861 static int
1862 emit_sevl (uint32_t *buf)
1863 {
1864   return aarch64_emit_insn (buf, SEVL);
1865 }
1866
1867 /* Write a WFE instruction into *BUF.
1868
1869    This is a hint instruction telling the hardware to wait for an event.  */
1870
1871 static int
1872 emit_wfe (uint32_t *buf)
1873 {
1874   return aarch64_emit_insn (buf, WFE);
1875 }
1876
1877 /* Write a SBFM instruction into *BUF.
1878
1879      SBFM rd, rn, #immr, #imms
1880
1881    This instruction moves the bits from #immr to #imms into the
1882    destination, sign extending the result.
1883
1884    RD is the destination register.
1885    RN is the source register.
1886    IMMR is the bit number to start at (least significant bit).
1887    IMMS is the bit number to stop at (most significant bit).  */
1888
1889 static int
1890 emit_sbfm (uint32_t *buf, struct aarch64_register rd,
1891            struct aarch64_register rn, uint32_t immr, uint32_t imms)
1892 {
1893   uint32_t size = ENCODE (rd.is64, 1, 31);
1894   uint32_t n = ENCODE (rd.is64, 1, 22);
1895
1896   return aarch64_emit_insn (buf, SBFM | size | n | ENCODE (immr, 6, 16)
1897                             | ENCODE (imms, 6, 10) | ENCODE (rn.num, 5, 5)
1898                             | ENCODE (rd.num, 5, 0));
1899 }
1900
1901 /* Write a SBFX instruction into *BUF.
1902
1903      SBFX rd, rn, #lsb, #width
1904
1905    This instruction moves #width bits from #lsb into the destination, sign
1906    extending the result.  This is an alias for:
1907
1908      SBFM rd, rn, #lsb, #(lsb + width - 1)
1909
1910    RD is the destination register.
1911    RN is the source register.
1912    LSB is the bit number to start at (least significant bit).
1913    WIDTH is the number of bits to move.  */
1914
1915 static int
1916 emit_sbfx (uint32_t *buf, struct aarch64_register rd,
1917            struct aarch64_register rn, uint32_t lsb, uint32_t width)
1918 {
1919   return emit_sbfm (buf, rd, rn, lsb, lsb + width - 1);
1920 }
1921
1922 /* Write a UBFM instruction into *BUF.
1923
1924      UBFM rd, rn, #immr, #imms
1925
1926    This instruction moves the bits from #immr to #imms into the
1927    destination, extending the result with zeros.
1928
1929    RD is the destination register.
1930    RN is the source register.
1931    IMMR is the bit number to start at (least significant bit).
1932    IMMS is the bit number to stop at (most significant bit).  */
1933
1934 static int
1935 emit_ubfm (uint32_t *buf, struct aarch64_register rd,
1936            struct aarch64_register rn, uint32_t immr, uint32_t imms)
1937 {
1938   uint32_t size = ENCODE (rd.is64, 1, 31);
1939   uint32_t n = ENCODE (rd.is64, 1, 22);
1940
1941   return aarch64_emit_insn (buf, UBFM | size | n | ENCODE (immr, 6, 16)
1942                             | ENCODE (imms, 6, 10) | ENCODE (rn.num, 5, 5)
1943                             | ENCODE (rd.num, 5, 0));
1944 }
1945
1946 /* Write a UBFX instruction into *BUF.
1947
1948      UBFX rd, rn, #lsb, #width
1949
1950    This instruction moves #width bits from #lsb into the destination,
1951    extending the result with zeros.  This is an alias for:
1952
1953      UBFM rd, rn, #lsb, #(lsb + width - 1)
1954
1955    RD is the destination register.
1956    RN is the source register.
1957    LSB is the bit number to start at (least significant bit).
1958    WIDTH is the number of bits to move.  */
1959
1960 static int
1961 emit_ubfx (uint32_t *buf, struct aarch64_register rd,
1962            struct aarch64_register rn, uint32_t lsb, uint32_t width)
1963 {
1964   return emit_ubfm (buf, rd, rn, lsb, lsb + width - 1);
1965 }
1966
1967 /* Write a CSINC instruction into *BUF.
1968
1969      CSINC rd, rn, rm, cond
1970
1971    This instruction conditionally increments rn or rm and places the result
1972    in rd.  rn is chosen is the condition is true.
1973
1974    RD is the destination register.
1975    RN and RM are the source registers.
1976    COND is the encoded condition.  */
1977
1978 static int
1979 emit_csinc (uint32_t *buf, struct aarch64_register rd,
1980             struct aarch64_register rn, struct aarch64_register rm,
1981             unsigned cond)
1982 {
1983   uint32_t size = ENCODE (rd.is64, 1, 31);
1984
1985   return aarch64_emit_insn (buf, CSINC | size | ENCODE (rm.num, 5, 16)
1986                             | ENCODE (cond, 4, 12) | ENCODE (rn.num, 5, 5)
1987                             | ENCODE (rd.num, 5, 0));
1988 }
1989
1990 /* Write a CSET instruction into *BUF.
1991
1992      CSET rd, cond
1993
1994    This instruction conditionally write 1 or 0 in the destination register.
1995    1 is written if the condition is true.  This is an alias for:
1996
1997      CSINC rd, xzr, xzr, !cond
1998
1999    Note that the condition needs to be inverted.
2000
2001    RD is the destination register.
2002    RN and RM are the source registers.
2003    COND is the encoded condition.  */
2004
2005 static int
2006 emit_cset (uint32_t *buf, struct aarch64_register rd, unsigned cond)
2007 {
2008   /* The least significant bit of the condition needs toggling in order to
2009      invert it.  */
2010   return emit_csinc (buf, rd, xzr, xzr, cond ^ 0x1);
2011 }
2012
2013 /* Write LEN instructions from BUF into the inferior memory at *TO.
2014
2015    Note instructions are always little endian on AArch64, unlike data.  */
2016
2017 static void
2018 append_insns (CORE_ADDR *to, size_t len, const uint32_t *buf)
2019 {
2020   size_t byte_len = len * sizeof (uint32_t);
2021 #if (__BYTE_ORDER == __BIG_ENDIAN)
2022   uint32_t *le_buf = (uint32_t *) xmalloc (byte_len);
2023   size_t i;
2024
2025   for (i = 0; i < len; i++)
2026     le_buf[i] = htole32 (buf[i]);
2027
2028   target_write_memory (*to, (const unsigned char *) le_buf, byte_len);
2029
2030   xfree (le_buf);
2031 #else
2032   target_write_memory (*to, (const unsigned char *) buf, byte_len);
2033 #endif
2034
2035   *to += byte_len;
2036 }
2037
2038 /* Sub-class of struct aarch64_insn_data, store information of
2039    instruction relocation for fast tracepoint.  Visitor can
2040    relocate an instruction from BASE.INSN_ADDR to NEW_ADDR and save
2041    the relocated instructions in buffer pointed by INSN_PTR.  */
2042
2043 struct aarch64_insn_relocation_data
2044 {
2045   struct aarch64_insn_data base;
2046
2047   /* The new address the instruction is relocated to.  */
2048   CORE_ADDR new_addr;
2049   /* Pointer to the buffer of relocated instruction(s).  */
2050   uint32_t *insn_ptr;
2051 };
2052
2053 /* Implementation of aarch64_insn_visitor method "b".  */
2054
2055 static void
2056 aarch64_ftrace_insn_reloc_b (const int is_bl, const int32_t offset,
2057                              struct aarch64_insn_data *data)
2058 {
2059   struct aarch64_insn_relocation_data *insn_reloc
2060     = (struct aarch64_insn_relocation_data *) data;
2061   int64_t new_offset
2062     = insn_reloc->base.insn_addr - insn_reloc->new_addr + offset;
2063
2064   if (can_encode_int32 (new_offset, 28))
2065     insn_reloc->insn_ptr += emit_b (insn_reloc->insn_ptr, is_bl, new_offset);
2066 }
2067
2068 /* Implementation of aarch64_insn_visitor method "b_cond".  */
2069
2070 static void
2071 aarch64_ftrace_insn_reloc_b_cond (const unsigned cond, const int32_t offset,
2072                                   struct aarch64_insn_data *data)
2073 {
2074   struct aarch64_insn_relocation_data *insn_reloc
2075     = (struct aarch64_insn_relocation_data *) data;
2076   int64_t new_offset
2077     = insn_reloc->base.insn_addr - insn_reloc->new_addr + offset;
2078
2079   if (can_encode_int32 (new_offset, 21))
2080     {
2081       insn_reloc->insn_ptr += emit_bcond (insn_reloc->insn_ptr, cond,
2082                                           new_offset);
2083     }
2084   else if (can_encode_int32 (new_offset, 28))
2085     {
2086       /* The offset is out of range for a conditional branch
2087          instruction but not for a unconditional branch.  We can use
2088          the following instructions instead:
2089
2090          B.COND TAKEN    ; If cond is true, then jump to TAKEN.
2091          B NOT_TAKEN     ; Else jump over TAKEN and continue.
2092          TAKEN:
2093          B #(offset - 8)
2094          NOT_TAKEN:
2095
2096       */
2097
2098       insn_reloc->insn_ptr += emit_bcond (insn_reloc->insn_ptr, cond, 8);
2099       insn_reloc->insn_ptr += emit_b (insn_reloc->insn_ptr, 0, 8);
2100       insn_reloc->insn_ptr += emit_b (insn_reloc->insn_ptr, 0, new_offset - 8);
2101     }
2102 }
2103
2104 /* Implementation of aarch64_insn_visitor method "cb".  */
2105
2106 static void
2107 aarch64_ftrace_insn_reloc_cb (const int32_t offset, const int is_cbnz,
2108                               const unsigned rn, int is64,
2109                               struct aarch64_insn_data *data)
2110 {
2111   struct aarch64_insn_relocation_data *insn_reloc
2112     = (struct aarch64_insn_relocation_data *) data;
2113   int64_t new_offset
2114     = insn_reloc->base.insn_addr - insn_reloc->new_addr + offset;
2115
2116   if (can_encode_int32 (new_offset, 21))
2117     {
2118       insn_reloc->insn_ptr += emit_cb (insn_reloc->insn_ptr, is_cbnz,
2119                                        aarch64_register (rn, is64), new_offset);
2120     }
2121   else if (can_encode_int32 (new_offset, 28))
2122     {
2123       /* The offset is out of range for a compare and branch
2124          instruction but not for a unconditional branch.  We can use
2125          the following instructions instead:
2126
2127          CBZ xn, TAKEN   ; xn == 0, then jump to TAKEN.
2128          B NOT_TAKEN     ; Else jump over TAKEN and continue.
2129          TAKEN:
2130          B #(offset - 8)
2131          NOT_TAKEN:
2132
2133       */
2134       insn_reloc->insn_ptr += emit_cb (insn_reloc->insn_ptr, is_cbnz,
2135                                        aarch64_register (rn, is64), 8);
2136       insn_reloc->insn_ptr += emit_b (insn_reloc->insn_ptr, 0, 8);
2137       insn_reloc->insn_ptr += emit_b (insn_reloc->insn_ptr, 0, new_offset - 8);
2138     }
2139 }
2140
2141 /* Implementation of aarch64_insn_visitor method "tb".  */
2142
2143 static void
2144 aarch64_ftrace_insn_reloc_tb (const int32_t offset, int is_tbnz,
2145                               const unsigned rt, unsigned bit,
2146                               struct aarch64_insn_data *data)
2147 {
2148   struct aarch64_insn_relocation_data *insn_reloc
2149     = (struct aarch64_insn_relocation_data *) data;
2150   int64_t new_offset
2151     = insn_reloc->base.insn_addr - insn_reloc->new_addr + offset;
2152
2153   if (can_encode_int32 (new_offset, 16))
2154     {
2155       insn_reloc->insn_ptr += emit_tb (insn_reloc->insn_ptr, is_tbnz, bit,
2156                                        aarch64_register (rt, 1), new_offset);
2157     }
2158   else if (can_encode_int32 (new_offset, 28))
2159     {
2160       /* The offset is out of range for a test bit and branch
2161          instruction but not for a unconditional branch.  We can use
2162          the following instructions instead:
2163
2164          TBZ xn, #bit, TAKEN ; xn[bit] == 0, then jump to TAKEN.
2165          B NOT_TAKEN         ; Else jump over TAKEN and continue.
2166          TAKEN:
2167          B #(offset - 8)
2168          NOT_TAKEN:
2169
2170       */
2171       insn_reloc->insn_ptr += emit_tb (insn_reloc->insn_ptr, is_tbnz, bit,
2172                                        aarch64_register (rt, 1), 8);
2173       insn_reloc->insn_ptr += emit_b (insn_reloc->insn_ptr, 0, 8);
2174       insn_reloc->insn_ptr += emit_b (insn_reloc->insn_ptr, 0,
2175                                       new_offset - 8);
2176     }
2177 }
2178
2179 /* Implementation of aarch64_insn_visitor method "adr".  */
2180
2181 static void
2182 aarch64_ftrace_insn_reloc_adr (const int32_t offset, const unsigned rd,
2183                                const int is_adrp,
2184                                struct aarch64_insn_data *data)
2185 {
2186   struct aarch64_insn_relocation_data *insn_reloc
2187     = (struct aarch64_insn_relocation_data *) data;
2188   /* We know exactly the address the ADR{P,} instruction will compute.
2189      We can just write it to the destination register.  */
2190   CORE_ADDR address = data->insn_addr + offset;
2191
2192   if (is_adrp)
2193     {
2194       /* Clear the lower 12 bits of the offset to get the 4K page.  */
2195       insn_reloc->insn_ptr += emit_mov_addr (insn_reloc->insn_ptr,
2196                                              aarch64_register (rd, 1),
2197                                              address & ~0xfff);
2198     }
2199   else
2200     insn_reloc->insn_ptr += emit_mov_addr (insn_reloc->insn_ptr,
2201                                            aarch64_register (rd, 1), address);
2202 }
2203
2204 /* Implementation of aarch64_insn_visitor method "ldr_literal".  */
2205
2206 static void
2207 aarch64_ftrace_insn_reloc_ldr_literal (const int32_t offset, const int is_sw,
2208                                        const unsigned rt, const int is64,
2209                                        struct aarch64_insn_data *data)
2210 {
2211   struct aarch64_insn_relocation_data *insn_reloc
2212     = (struct aarch64_insn_relocation_data *) data;
2213   CORE_ADDR address = data->insn_addr + offset;
2214
2215   insn_reloc->insn_ptr += emit_mov_addr (insn_reloc->insn_ptr,
2216                                          aarch64_register (rt, 1), address);
2217
2218   /* We know exactly what address to load from, and what register we
2219      can use:
2220
2221      MOV xd, #(oldloc + offset)
2222      MOVK xd, #((oldloc + offset) >> 16), lsl #16
2223      ...
2224
2225      LDR xd, [xd] ; or LDRSW xd, [xd]
2226
2227   */
2228
2229   if (is_sw)
2230     insn_reloc->insn_ptr += emit_ldrsw (insn_reloc->insn_ptr,
2231                                         aarch64_register (rt, 1),
2232                                         aarch64_register (rt, 1),
2233                                         offset_memory_operand (0));
2234   else
2235     insn_reloc->insn_ptr += emit_ldr (insn_reloc->insn_ptr,
2236                                       aarch64_register (rt, is64),
2237                                       aarch64_register (rt, 1),
2238                                       offset_memory_operand (0));
2239 }
2240
2241 /* Implementation of aarch64_insn_visitor method "others".  */
2242
2243 static void
2244 aarch64_ftrace_insn_reloc_others (const uint32_t insn,
2245                                   struct aarch64_insn_data *data)
2246 {
2247   struct aarch64_insn_relocation_data *insn_reloc
2248     = (struct aarch64_insn_relocation_data *) data;
2249
2250   /* The instruction is not PC relative.  Just re-emit it at the new
2251      location.  */
2252   insn_reloc->insn_ptr += aarch64_emit_insn (insn_reloc->insn_ptr, insn);
2253 }
2254
2255 static const struct aarch64_insn_visitor visitor =
2256 {
2257   aarch64_ftrace_insn_reloc_b,
2258   aarch64_ftrace_insn_reloc_b_cond,
2259   aarch64_ftrace_insn_reloc_cb,
2260   aarch64_ftrace_insn_reloc_tb,
2261   aarch64_ftrace_insn_reloc_adr,
2262   aarch64_ftrace_insn_reloc_ldr_literal,
2263   aarch64_ftrace_insn_reloc_others,
2264 };
2265
2266 bool
2267 aarch64_target::supports_fast_tracepoints ()
2268 {
2269   return true;
2270 }
2271
2272 /* Implementation of target ops method
2273    "install_fast_tracepoint_jump_pad".  */
2274
2275 int
2276 aarch64_target::install_fast_tracepoint_jump_pad
2277   (CORE_ADDR tpoint, CORE_ADDR tpaddr, CORE_ADDR collector,
2278    CORE_ADDR lockaddr, ULONGEST orig_size, CORE_ADDR *jump_entry,
2279    CORE_ADDR *trampoline, ULONGEST *trampoline_size,
2280    unsigned char *jjump_pad_insn, ULONGEST *jjump_pad_insn_size,
2281    CORE_ADDR *adjusted_insn_addr, CORE_ADDR *adjusted_insn_addr_end,
2282    char *err)
2283 {
2284   uint32_t buf[256];
2285   uint32_t *p = buf;
2286   int64_t offset;
2287   int i;
2288   uint32_t insn;
2289   CORE_ADDR buildaddr = *jump_entry;
2290   struct aarch64_insn_relocation_data insn_data;
2291
2292   /* We need to save the current state on the stack both to restore it
2293      later and to collect register values when the tracepoint is hit.
2294
2295      The saved registers are pushed in a layout that needs to be in sync
2296      with aarch64_ft_collect_regmap (see linux-aarch64-ipa.c).  Later on
2297      the supply_fast_tracepoint_registers function will fill in the
2298      register cache from a pointer to saved registers on the stack we build
2299      here.
2300
2301      For simplicity, we set the size of each cell on the stack to 16 bytes.
2302      This way one cell can hold any register type, from system registers
2303      to the 128 bit SIMD&FP registers.  Furthermore, the stack pointer
2304      has to be 16 bytes aligned anyway.
2305
2306      Note that the CPSR register does not exist on AArch64.  Instead we
2307      can access system bits describing the process state with the
2308      MRS/MSR instructions, namely the condition flags.  We save them as
2309      if they are part of a CPSR register because that's how GDB
2310      interprets these system bits.  At the moment, only the condition
2311      flags are saved in CPSR (NZCV).
2312
2313      Stack layout, each cell is 16 bytes (descending):
2314
2315      High *-------- SIMD&FP registers from 31 down to 0. --------*
2316           | q31                                                  |
2317           .                                                      .
2318           .                                                      . 32 cells
2319           .                                                      .
2320           | q0                                                   |
2321           *---- General purpose registers from 30 down to 0. ----*
2322           | x30                                                  |
2323           .                                                      .
2324           .                                                      . 31 cells
2325           .                                                      .
2326           | x0                                                   |
2327           *------------- Special purpose registers. -------------*
2328           | SP                                                   |
2329           | PC                                                   |
2330           | CPSR (NZCV)                                          | 5 cells
2331           | FPSR                                                 |
2332           | FPCR                                                 | <- SP + 16
2333           *------------- collecting_t object --------------------*
2334           | TPIDR_EL0               | struct tracepoint *        |
2335      Low  *------------------------------------------------------*
2336
2337      After this stack is set up, we issue a call to the collector, passing
2338      it the saved registers at (SP + 16).  */
2339
2340   /* Push SIMD&FP registers on the stack:
2341
2342        SUB sp, sp, #(32 * 16)
2343
2344        STP q30, q31, [sp, #(30 * 16)]
2345        ...
2346        STP q0, q1, [sp]
2347
2348      */
2349   p += emit_sub (p, sp, sp, immediate_operand (32 * 16));
2350   for (i = 30; i >= 0; i -= 2)
2351     p += emit_stp_q_offset (p, i, i + 1, sp, i * 16);
2352
2353   /* Push general purpose registers on the stack.  Note that we do not need
2354      to push x31 as it represents the xzr register and not the stack
2355      pointer in a STR instruction.
2356
2357        SUB sp, sp, #(31 * 16)
2358
2359        STR x30, [sp, #(30 * 16)]
2360        ...
2361        STR x0, [sp]
2362
2363      */
2364   p += emit_sub (p, sp, sp, immediate_operand (31 * 16));
2365   for (i = 30; i >= 0; i -= 1)
2366     p += emit_str (p, aarch64_register (i, 1), sp,
2367                    offset_memory_operand (i * 16));
2368
2369   /* Make space for 5 more cells.
2370
2371        SUB sp, sp, #(5 * 16)
2372
2373      */
2374   p += emit_sub (p, sp, sp, immediate_operand (5 * 16));
2375
2376
2377   /* Save SP:
2378
2379        ADD x4, sp, #((32 + 31 + 5) * 16)
2380        STR x4, [sp, #(4 * 16)]
2381
2382      */
2383   p += emit_add (p, x4, sp, immediate_operand ((32 + 31 + 5) * 16));
2384   p += emit_str (p, x4, sp, offset_memory_operand (4 * 16));
2385
2386   /* Save PC (tracepoint address):
2387
2388        MOV  x3, #(tpaddr)
2389        ...
2390
2391        STR x3, [sp, #(3 * 16)]
2392
2393      */
2394
2395   p += emit_mov_addr (p, x3, tpaddr);
2396   p += emit_str (p, x3, sp, offset_memory_operand (3 * 16));
2397
2398   /* Save CPSR (NZCV), FPSR and FPCR:
2399
2400        MRS x2, nzcv
2401        MRS x1, fpsr
2402        MRS x0, fpcr
2403
2404        STR x2, [sp, #(2 * 16)]
2405        STR x1, [sp, #(1 * 16)]
2406        STR x0, [sp, #(0 * 16)]
2407
2408      */
2409   p += emit_mrs (p, x2, NZCV);
2410   p += emit_mrs (p, x1, FPSR);
2411   p += emit_mrs (p, x0, FPCR);
2412   p += emit_str (p, x2, sp, offset_memory_operand (2 * 16));
2413   p += emit_str (p, x1, sp, offset_memory_operand (1 * 16));
2414   p += emit_str (p, x0, sp, offset_memory_operand (0 * 16));
2415
2416   /* Push the collecting_t object.  It consist of the address of the
2417      tracepoint and an ID for the current thread.  We get the latter by
2418      reading the tpidr_el0 system register.  It corresponds to the
2419      NT_ARM_TLS register accessible with ptrace.
2420
2421        MOV x0, #(tpoint)
2422        ...
2423
2424        MRS x1, tpidr_el0
2425
2426        STP x0, x1, [sp, #-16]!
2427
2428      */
2429
2430   p += emit_mov_addr (p, x0, tpoint);
2431   p += emit_mrs (p, x1, TPIDR_EL0);
2432   p += emit_stp (p, x0, x1, sp, preindex_memory_operand (-16));
2433
2434   /* Spin-lock:
2435
2436      The shared memory for the lock is at lockaddr.  It will hold zero
2437      if no-one is holding the lock, otherwise it contains the address of
2438      the collecting_t object on the stack of the thread which acquired it.
2439
2440      At this stage, the stack pointer points to this thread's collecting_t
2441      object.
2442
2443      We use the following registers:
2444      - x0: Address of the lock.
2445      - x1: Pointer to collecting_t object.
2446      - x2: Scratch register.
2447
2448        MOV x0, #(lockaddr)
2449        ...
2450        MOV x1, sp
2451
2452        ; Trigger an event local to this core.  So the following WFE
2453        ; instruction is ignored.
2454        SEVL
2455      again:
2456        ; Wait for an event.  The event is triggered by either the SEVL
2457        ; or STLR instructions (store release).
2458        WFE
2459
2460        ; Atomically read at lockaddr.  This marks the memory location as
2461        ; exclusive.  This instruction also has memory constraints which
2462        ; make sure all previous data reads and writes are done before
2463        ; executing it.
2464        LDAXR x2, [x0]
2465
2466        ; Try again if another thread holds the lock.
2467        CBNZ x2, again
2468
2469        ; We can lock it!  Write the address of the collecting_t object.
2470        ; This instruction will fail if the memory location is not marked
2471        ; as exclusive anymore.  If it succeeds, it will remove the
2472        ; exclusive mark on the memory location.  This way, if another
2473        ; thread executes this instruction before us, we will fail and try
2474        ; all over again.
2475        STXR w2, x1, [x0]
2476        CBNZ w2, again
2477
2478      */
2479
2480   p += emit_mov_addr (p, x0, lockaddr);
2481   p += emit_mov (p, x1, register_operand (sp));
2482
2483   p += emit_sevl (p);
2484   p += emit_wfe (p);
2485   p += emit_ldaxr (p, x2, x0);
2486   p += emit_cb (p, 1, w2, -2 * 4);
2487   p += emit_stxr (p, w2, x1, x0);
2488   p += emit_cb (p, 1, x2, -4 * 4);
2489
2490   /* Call collector (struct tracepoint *, unsigned char *):
2491
2492        MOV x0, #(tpoint)
2493        ...
2494
2495        ; Saved registers start after the collecting_t object.
2496        ADD x1, sp, #16
2497
2498        ; We use an intra-procedure-call scratch register.
2499        MOV ip0, #(collector)
2500        ...
2501
2502        ; And call back to C!
2503        BLR ip0
2504
2505      */
2506
2507   p += emit_mov_addr (p, x0, tpoint);
2508   p += emit_add (p, x1, sp, immediate_operand (16));
2509
2510   p += emit_mov_addr (p, ip0, collector);
2511   p += emit_blr (p, ip0);
2512
2513   /* Release the lock.
2514
2515        MOV x0, #(lockaddr)
2516        ...
2517
2518        ; This instruction is a normal store with memory ordering
2519        ; constraints.  Thanks to this we do not have to put a data
2520        ; barrier instruction to make sure all data read and writes are done
2521        ; before this instruction is executed.  Furthermore, this instruction
2522        ; will trigger an event, letting other threads know they can grab
2523        ; the lock.
2524        STLR xzr, [x0]
2525
2526      */
2527   p += emit_mov_addr (p, x0, lockaddr);
2528   p += emit_stlr (p, xzr, x0);
2529
2530   /* Free collecting_t object:
2531
2532        ADD sp, sp, #16
2533
2534      */
2535   p += emit_add (p, sp, sp, immediate_operand (16));
2536
2537   /* Restore CPSR (NZCV), FPSR and FPCR.  And free all special purpose
2538      registers from the stack.
2539
2540        LDR x2, [sp, #(2 * 16)]
2541        LDR x1, [sp, #(1 * 16)]
2542        LDR x0, [sp, #(0 * 16)]
2543
2544        MSR NZCV, x2
2545        MSR FPSR, x1
2546        MSR FPCR, x0
2547
2548        ADD sp, sp #(5 * 16)
2549
2550      */
2551   p += emit_ldr (p, x2, sp, offset_memory_operand (2 * 16));
2552   p += emit_ldr (p, x1, sp, offset_memory_operand (1 * 16));
2553   p += emit_ldr (p, x0, sp, offset_memory_operand (0 * 16));
2554   p += emit_msr (p, NZCV, x2);
2555   p += emit_msr (p, FPSR, x1);
2556   p += emit_msr (p, FPCR, x0);
2557
2558   p += emit_add (p, sp, sp, immediate_operand (5 * 16));
2559
2560   /* Pop general purpose registers:
2561
2562        LDR x0, [sp]
2563        ...
2564        LDR x30, [sp, #(30 * 16)]
2565
2566        ADD sp, sp, #(31 * 16)
2567
2568      */
2569   for (i = 0; i <= 30; i += 1)
2570     p += emit_ldr (p, aarch64_register (i, 1), sp,
2571                    offset_memory_operand (i * 16));
2572   p += emit_add (p, sp, sp, immediate_operand (31 * 16));
2573
2574   /* Pop SIMD&FP registers:
2575
2576        LDP q0, q1, [sp]
2577        ...
2578        LDP q30, q31, [sp, #(30 * 16)]
2579
2580        ADD sp, sp, #(32 * 16)
2581
2582      */
2583   for (i = 0; i <= 30; i += 2)
2584     p += emit_ldp_q_offset (p, i, i + 1, sp, i * 16);
2585   p += emit_add (p, sp, sp, immediate_operand (32 * 16));
2586
2587   /* Write the code into the inferior memory.  */
2588   append_insns (&buildaddr, p - buf, buf);
2589
2590   /* Now emit the relocated instruction.  */
2591   *adjusted_insn_addr = buildaddr;
2592   target_read_uint32 (tpaddr, &insn);
2593
2594   insn_data.base.insn_addr = tpaddr;
2595   insn_data.new_addr = buildaddr;
2596   insn_data.insn_ptr = buf;
2597
2598   aarch64_relocate_instruction (insn, &visitor,
2599                                 (struct aarch64_insn_data *) &insn_data);
2600
2601   /* We may not have been able to relocate the instruction.  */
2602   if (insn_data.insn_ptr == buf)
2603     {
2604       sprintf (err,
2605                "E.Could not relocate instruction from %s to %s.",
2606                core_addr_to_string_nz (tpaddr),
2607                core_addr_to_string_nz (buildaddr));
2608       return 1;
2609     }
2610   else
2611     append_insns (&buildaddr, insn_data.insn_ptr - buf, buf);
2612   *adjusted_insn_addr_end = buildaddr;
2613
2614   /* Go back to the start of the buffer.  */
2615   p = buf;
2616
2617   /* Emit a branch back from the jump pad.  */
2618   offset = (tpaddr + orig_size - buildaddr);
2619   if (!can_encode_int32 (offset, 28))
2620     {
2621       sprintf (err,
2622                "E.Jump back from jump pad too far from tracepoint "
2623                "(offset 0x%" PRIx64 " cannot be encoded in 28 bits).",
2624                offset);
2625       return 1;
2626     }
2627
2628   p += emit_b (p, 0, offset);
2629   append_insns (&buildaddr, p - buf, buf);
2630
2631   /* Give the caller a branch instruction into the jump pad.  */
2632   offset = (*jump_entry - tpaddr);
2633   if (!can_encode_int32 (offset, 28))
2634     {
2635       sprintf (err,
2636                "E.Jump pad too far from tracepoint "
2637                "(offset 0x%" PRIx64 " cannot be encoded in 28 bits).",
2638                offset);
2639       return 1;
2640     }
2641
2642   emit_b ((uint32_t *) jjump_pad_insn, 0, offset);
2643   *jjump_pad_insn_size = 4;
2644
2645   /* Return the end address of our pad.  */
2646   *jump_entry = buildaddr;
2647
2648   return 0;
2649 }
2650
2651 /* Helper function writing LEN instructions from START into
2652    current_insn_ptr.  */
2653
2654 static void
2655 emit_ops_insns (const uint32_t *start, int len)
2656 {
2657   CORE_ADDR buildaddr = current_insn_ptr;
2658
2659   threads_debug_printf ("Adding %d instructions at %s",
2660                         len, paddress (buildaddr));
2661
2662   append_insns (&buildaddr, len, start);
2663   current_insn_ptr = buildaddr;
2664 }
2665
2666 /* Pop a register from the stack.  */
2667
2668 static int
2669 emit_pop (uint32_t *buf, struct aarch64_register rt)
2670 {
2671   return emit_ldr (buf, rt, sp, postindex_memory_operand (1 * 16));
2672 }
2673
2674 /* Push a register on the stack.  */
2675
2676 static int
2677 emit_push (uint32_t *buf, struct aarch64_register rt)
2678 {
2679   return emit_str (buf, rt, sp, preindex_memory_operand (-1 * 16));
2680 }
2681
2682 /* Implementation of emit_ops method "emit_prologue".  */
2683
2684 static void
2685 aarch64_emit_prologue (void)
2686 {
2687   uint32_t buf[16];
2688   uint32_t *p = buf;
2689
2690   /* This function emit a prologue for the following function prototype:
2691
2692      enum eval_result_type f (unsigned char *regs,
2693                               ULONGEST *value);
2694
2695      The first argument is a buffer of raw registers.  The second
2696      argument is the result of
2697      evaluating the expression, which will be set to whatever is on top of
2698      the stack at the end.
2699
2700      The stack set up by the prologue is as such:
2701
2702      High *------------------------------------------------------*
2703           | LR                                                   |
2704           | FP                                                   | <- FP
2705           | x1  (ULONGEST *value)                                |
2706           | x0  (unsigned char *regs)                            |
2707      Low  *------------------------------------------------------*
2708
2709      As we are implementing a stack machine, each opcode can expand the
2710      stack so we never know how far we are from the data saved by this
2711      prologue.  In order to be able refer to value and regs later, we save
2712      the current stack pointer in the frame pointer.  This way, it is not
2713      clobbered when calling C functions.
2714
2715      Finally, throughout every operation, we are using register x0 as the
2716      top of the stack, and x1 as a scratch register.  */
2717
2718   p += emit_stp (p, x0, x1, sp, preindex_memory_operand (-2 * 16));
2719   p += emit_str (p, lr, sp, offset_memory_operand (3 * 8));
2720   p += emit_str (p, fp, sp, offset_memory_operand (2 * 8));
2721
2722   p += emit_add (p, fp, sp, immediate_operand (2 * 8));
2723
2724
2725   emit_ops_insns (buf, p - buf);
2726 }
2727
2728 /* Implementation of emit_ops method "emit_epilogue".  */
2729
2730 static void
2731 aarch64_emit_epilogue (void)
2732 {
2733   uint32_t buf[16];
2734   uint32_t *p = buf;
2735
2736   /* Store the result of the expression (x0) in *value.  */
2737   p += emit_sub (p, x1, fp, immediate_operand (1 * 8));
2738   p += emit_ldr (p, x1, x1, offset_memory_operand (0));
2739   p += emit_str (p, x0, x1, offset_memory_operand (0));
2740
2741   /* Restore the previous state.  */
2742   p += emit_add (p, sp, fp, immediate_operand (2 * 8));
2743   p += emit_ldp (p, fp, lr, fp, offset_memory_operand (0));
2744
2745   /* Return expr_eval_no_error.  */
2746   p += emit_mov (p, x0, immediate_operand (expr_eval_no_error));
2747   p += emit_ret (p, lr);
2748
2749   emit_ops_insns (buf, p - buf);
2750 }
2751
2752 /* Implementation of emit_ops method "emit_add".  */
2753
2754 static void
2755 aarch64_emit_add (void)
2756 {
2757   uint32_t buf[16];
2758   uint32_t *p = buf;
2759
2760   p += emit_pop (p, x1);
2761   p += emit_add (p, x0, x1, register_operand (x0));
2762
2763   emit_ops_insns (buf, p - buf);
2764 }
2765
2766 /* Implementation of emit_ops method "emit_sub".  */
2767
2768 static void
2769 aarch64_emit_sub (void)
2770 {
2771   uint32_t buf[16];
2772   uint32_t *p = buf;
2773
2774   p += emit_pop (p, x1);
2775   p += emit_sub (p, x0, x1, register_operand (x0));
2776
2777   emit_ops_insns (buf, p - buf);
2778 }
2779
2780 /* Implementation of emit_ops method "emit_mul".  */
2781
2782 static void
2783 aarch64_emit_mul (void)
2784 {
2785   uint32_t buf[16];
2786   uint32_t *p = buf;
2787
2788   p += emit_pop (p, x1);
2789   p += emit_mul (p, x0, x1, x0);
2790
2791   emit_ops_insns (buf, p - buf);
2792 }
2793
2794 /* Implementation of emit_ops method "emit_lsh".  */
2795
2796 static void
2797 aarch64_emit_lsh (void)
2798 {
2799   uint32_t buf[16];
2800   uint32_t *p = buf;
2801
2802   p += emit_pop (p, x1);
2803   p += emit_lslv (p, x0, x1, x0);
2804
2805   emit_ops_insns (buf, p - buf);
2806 }
2807
2808 /* Implementation of emit_ops method "emit_rsh_signed".  */
2809
2810 static void
2811 aarch64_emit_rsh_signed (void)
2812 {
2813   uint32_t buf[16];
2814   uint32_t *p = buf;
2815
2816   p += emit_pop (p, x1);
2817   p += emit_asrv (p, x0, x1, x0);
2818
2819   emit_ops_insns (buf, p - buf);
2820 }
2821
2822 /* Implementation of emit_ops method "emit_rsh_unsigned".  */
2823
2824 static void
2825 aarch64_emit_rsh_unsigned (void)
2826 {
2827   uint32_t buf[16];
2828   uint32_t *p = buf;
2829
2830   p += emit_pop (p, x1);
2831   p += emit_lsrv (p, x0, x1, x0);
2832
2833   emit_ops_insns (buf, p - buf);
2834 }
2835
2836 /* Implementation of emit_ops method "emit_ext".  */
2837
2838 static void
2839 aarch64_emit_ext (int arg)
2840 {
2841   uint32_t buf[16];
2842   uint32_t *p = buf;
2843
2844   p += emit_sbfx (p, x0, x0, 0, arg);
2845
2846   emit_ops_insns (buf, p - buf);
2847 }
2848
2849 /* Implementation of emit_ops method "emit_log_not".  */
2850
2851 static void
2852 aarch64_emit_log_not (void)
2853 {
2854   uint32_t buf[16];
2855   uint32_t *p = buf;
2856
2857   /* If the top of the stack is 0, replace it with 1.  Else replace it with
2858      0.  */
2859
2860   p += emit_cmp (p, x0, immediate_operand (0));
2861   p += emit_cset (p, x0, EQ);
2862
2863   emit_ops_insns (buf, p - buf);
2864 }
2865
2866 /* Implementation of emit_ops method "emit_bit_and".  */
2867
2868 static void
2869 aarch64_emit_bit_and (void)
2870 {
2871   uint32_t buf[16];
2872   uint32_t *p = buf;
2873
2874   p += emit_pop (p, x1);
2875   p += emit_and (p, x0, x0, x1);
2876
2877   emit_ops_insns (buf, p - buf);
2878 }
2879
2880 /* Implementation of emit_ops method "emit_bit_or".  */
2881
2882 static void
2883 aarch64_emit_bit_or (void)
2884 {
2885   uint32_t buf[16];
2886   uint32_t *p = buf;
2887
2888   p += emit_pop (p, x1);
2889   p += emit_orr (p, x0, x0, x1);
2890
2891   emit_ops_insns (buf, p - buf);
2892 }
2893
2894 /* Implementation of emit_ops method "emit_bit_xor".  */
2895
2896 static void
2897 aarch64_emit_bit_xor (void)
2898 {
2899   uint32_t buf[16];
2900   uint32_t *p = buf;
2901
2902   p += emit_pop (p, x1);
2903   p += emit_eor (p, x0, x0, x1);
2904
2905   emit_ops_insns (buf, p - buf);
2906 }
2907
2908 /* Implementation of emit_ops method "emit_bit_not".  */
2909
2910 static void
2911 aarch64_emit_bit_not (void)
2912 {
2913   uint32_t buf[16];
2914   uint32_t *p = buf;
2915
2916   p += emit_mvn (p, x0, x0);
2917
2918   emit_ops_insns (buf, p - buf);
2919 }
2920
2921 /* Implementation of emit_ops method "emit_equal".  */
2922
2923 static void
2924 aarch64_emit_equal (void)
2925 {
2926   uint32_t buf[16];
2927   uint32_t *p = buf;
2928
2929   p += emit_pop (p, x1);
2930   p += emit_cmp (p, x0, register_operand (x1));
2931   p += emit_cset (p, x0, EQ);
2932
2933   emit_ops_insns (buf, p - buf);
2934 }
2935
2936 /* Implementation of emit_ops method "emit_less_signed".  */
2937
2938 static void
2939 aarch64_emit_less_signed (void)
2940 {
2941   uint32_t buf[16];
2942   uint32_t *p = buf;
2943
2944   p += emit_pop (p, x1);
2945   p += emit_cmp (p, x1, register_operand (x0));
2946   p += emit_cset (p, x0, LT);
2947
2948   emit_ops_insns (buf, p - buf);
2949 }
2950
2951 /* Implementation of emit_ops method "emit_less_unsigned".  */
2952
2953 static void
2954 aarch64_emit_less_unsigned (void)
2955 {
2956   uint32_t buf[16];
2957   uint32_t *p = buf;
2958
2959   p += emit_pop (p, x1);
2960   p += emit_cmp (p, x1, register_operand (x0));
2961   p += emit_cset (p, x0, LO);
2962
2963   emit_ops_insns (buf, p - buf);
2964 }
2965
2966 /* Implementation of emit_ops method "emit_ref".  */
2967
2968 static void
2969 aarch64_emit_ref (int size)
2970 {
2971   uint32_t buf[16];
2972   uint32_t *p = buf;
2973
2974   switch (size)
2975     {
2976     case 1:
2977       p += emit_ldrb (p, w0, x0, offset_memory_operand (0));
2978       break;
2979     case 2:
2980       p += emit_ldrh (p, w0, x0, offset_memory_operand (0));
2981       break;
2982     case 4:
2983       p += emit_ldr (p, w0, x0, offset_memory_operand (0));
2984       break;
2985     case 8:
2986       p += emit_ldr (p, x0, x0, offset_memory_operand (0));
2987       break;
2988     default:
2989       /* Unknown size, bail on compilation.  */
2990       emit_error = 1;
2991       break;
2992     }
2993
2994   emit_ops_insns (buf, p - buf);
2995 }
2996
2997 /* Implementation of emit_ops method "emit_if_goto".  */
2998
2999 static void
3000 aarch64_emit_if_goto (int *offset_p, int *size_p)
3001 {
3002   uint32_t buf[16];
3003   uint32_t *p = buf;
3004
3005   /* The Z flag is set or cleared here.  */
3006   p += emit_cmp (p, x0, immediate_operand (0));
3007   /* This instruction must not change the Z flag.  */
3008   p += emit_pop (p, x0);
3009   /* Branch over the next instruction if x0 == 0.  */
3010   p += emit_bcond (p, EQ, 8);
3011
3012   /* The NOP instruction will be patched with an unconditional branch.  */
3013   if (offset_p)
3014     *offset_p = (p - buf) * 4;
3015   if (size_p)
3016     *size_p = 4;
3017   p += emit_nop (p);
3018
3019   emit_ops_insns (buf, p - buf);
3020 }
3021
3022 /* Implementation of emit_ops method "emit_goto".  */
3023
3024 static void
3025 aarch64_emit_goto (int *offset_p, int *size_p)
3026 {
3027   uint32_t buf[16];
3028   uint32_t *p = buf;
3029
3030   /* The NOP instruction will be patched with an unconditional branch.  */
3031   if (offset_p)
3032     *offset_p = 0;
3033   if (size_p)
3034     *size_p = 4;
3035   p += emit_nop (p);
3036
3037   emit_ops_insns (buf, p - buf);
3038 }
3039
3040 /* Implementation of emit_ops method "write_goto_address".  */
3041
3042 static void
3043 aarch64_write_goto_address (CORE_ADDR from, CORE_ADDR to, int size)
3044 {
3045   uint32_t insn;
3046
3047   emit_b (&insn, 0, to - from);
3048   append_insns (&from, 1, &insn);
3049 }
3050
3051 /* Implementation of emit_ops method "emit_const".  */
3052
3053 static void
3054 aarch64_emit_const (LONGEST num)
3055 {
3056   uint32_t buf[16];
3057   uint32_t *p = buf;
3058
3059   p += emit_mov_addr (p, x0, num);
3060
3061   emit_ops_insns (buf, p - buf);
3062 }
3063
3064 /* Implementation of emit_ops method "emit_call".  */
3065
3066 static void
3067 aarch64_emit_call (CORE_ADDR fn)
3068 {
3069   uint32_t buf[16];
3070   uint32_t *p = buf;
3071
3072   p += emit_mov_addr (p, ip0, fn);
3073   p += emit_blr (p, ip0);
3074
3075   emit_ops_insns (buf, p - buf);
3076 }
3077
3078 /* Implementation of emit_ops method "emit_reg".  */
3079
3080 static void
3081 aarch64_emit_reg (int reg)
3082 {
3083   uint32_t buf[16];
3084   uint32_t *p = buf;
3085
3086   /* Set x0 to unsigned char *regs.  */
3087   p += emit_sub (p, x0, fp, immediate_operand (2 * 8));
3088   p += emit_ldr (p, x0, x0, offset_memory_operand (0));
3089   p += emit_mov (p, x1, immediate_operand (reg));
3090
3091   emit_ops_insns (buf, p - buf);
3092
3093   aarch64_emit_call (get_raw_reg_func_addr ());
3094 }
3095
3096 /* Implementation of emit_ops method "emit_pop".  */
3097
3098 static void
3099 aarch64_emit_pop (void)
3100 {
3101   uint32_t buf[16];
3102   uint32_t *p = buf;
3103
3104   p += emit_pop (p, x0);
3105
3106   emit_ops_insns (buf, p - buf);
3107 }
3108
3109 /* Implementation of emit_ops method "emit_stack_flush".  */
3110
3111 static void
3112 aarch64_emit_stack_flush (void)
3113 {
3114   uint32_t buf[16];
3115   uint32_t *p = buf;
3116
3117   p += emit_push (p, x0);
3118
3119   emit_ops_insns (buf, p - buf);
3120 }
3121
3122 /* Implementation of emit_ops method "emit_zero_ext".  */
3123
3124 static void
3125 aarch64_emit_zero_ext (int arg)
3126 {
3127   uint32_t buf[16];
3128   uint32_t *p = buf;
3129
3130   p += emit_ubfx (p, x0, x0, 0, arg);
3131
3132   emit_ops_insns (buf, p - buf);
3133 }
3134
3135 /* Implementation of emit_ops method "emit_swap".  */
3136
3137 static void
3138 aarch64_emit_swap (void)
3139 {
3140   uint32_t buf[16];
3141   uint32_t *p = buf;
3142
3143   p += emit_ldr (p, x1, sp, offset_memory_operand (0 * 16));
3144   p += emit_str (p, x0, sp, offset_memory_operand (0 * 16));
3145   p += emit_mov (p, x0, register_operand (x1));
3146
3147   emit_ops_insns (buf, p - buf);
3148 }
3149
3150 /* Implementation of emit_ops method "emit_stack_adjust".  */
3151
3152 static void
3153 aarch64_emit_stack_adjust (int n)
3154 {
3155   /* This is not needed with our design.  */
3156   uint32_t buf[16];
3157   uint32_t *p = buf;
3158
3159   p += emit_add (p, sp, sp, immediate_operand (n * 16));
3160
3161   emit_ops_insns (buf, p - buf);
3162 }
3163
3164 /* Implementation of emit_ops method "emit_int_call_1".  */
3165
3166 static void
3167 aarch64_emit_int_call_1 (CORE_ADDR fn, int arg1)
3168 {
3169   uint32_t buf[16];
3170   uint32_t *p = buf;
3171
3172   p += emit_mov (p, x0, immediate_operand (arg1));
3173
3174   emit_ops_insns (buf, p - buf);
3175
3176   aarch64_emit_call (fn);
3177 }
3178
3179 /* Implementation of emit_ops method "emit_void_call_2".  */
3180
3181 static void
3182 aarch64_emit_void_call_2 (CORE_ADDR fn, int arg1)
3183 {
3184   uint32_t buf[16];
3185   uint32_t *p = buf;
3186
3187   /* Push x0 on the stack.  */
3188   aarch64_emit_stack_flush ();
3189
3190   /* Setup arguments for the function call:
3191
3192      x0: arg1
3193      x1: top of the stack
3194
3195        MOV x1, x0
3196        MOV x0, #arg1  */
3197
3198   p += emit_mov (p, x1, register_operand (x0));
3199   p += emit_mov (p, x0, immediate_operand (arg1));
3200
3201   emit_ops_insns (buf, p - buf);
3202
3203   aarch64_emit_call (fn);
3204
3205   /* Restore x0.  */
3206   aarch64_emit_pop ();
3207 }
3208
3209 /* Implementation of emit_ops method "emit_eq_goto".  */
3210
3211 static void
3212 aarch64_emit_eq_goto (int *offset_p, int *size_p)
3213 {
3214   uint32_t buf[16];
3215   uint32_t *p = buf;
3216
3217   p += emit_pop (p, x1);
3218   p += emit_cmp (p, x1, register_operand (x0));
3219   /* Branch over the next instruction if x0 != x1.  */
3220   p += emit_bcond (p, NE, 8);
3221   /* The NOP instruction will be patched with an unconditional branch.  */
3222   if (offset_p)
3223     *offset_p = (p - buf) * 4;
3224   if (size_p)
3225     *size_p = 4;
3226   p += emit_nop (p);
3227
3228   emit_ops_insns (buf, p - buf);
3229 }
3230
3231 /* Implementation of emit_ops method "emit_ne_goto".  */
3232
3233 static void
3234 aarch64_emit_ne_goto (int *offset_p, int *size_p)
3235 {
3236   uint32_t buf[16];
3237   uint32_t *p = buf;
3238
3239   p += emit_pop (p, x1);
3240   p += emit_cmp (p, x1, register_operand (x0));
3241   /* Branch over the next instruction if x0 == x1.  */
3242   p += emit_bcond (p, EQ, 8);
3243   /* The NOP instruction will be patched with an unconditional branch.  */
3244   if (offset_p)
3245     *offset_p = (p - buf) * 4;
3246   if (size_p)
3247     *size_p = 4;
3248   p += emit_nop (p);
3249
3250   emit_ops_insns (buf, p - buf);
3251 }
3252
3253 /* Implementation of emit_ops method "emit_lt_goto".  */
3254
3255 static void
3256 aarch64_emit_lt_goto (int *offset_p, int *size_p)
3257 {
3258   uint32_t buf[16];
3259   uint32_t *p = buf;
3260
3261   p += emit_pop (p, x1);
3262   p += emit_cmp (p, x1, register_operand (x0));
3263   /* Branch over the next instruction if x0 >= x1.  */
3264   p += emit_bcond (p, GE, 8);
3265   /* The NOP instruction will be patched with an unconditional branch.  */
3266   if (offset_p)
3267     *offset_p = (p - buf) * 4;
3268   if (size_p)
3269     *size_p = 4;
3270   p += emit_nop (p);
3271
3272   emit_ops_insns (buf, p - buf);
3273 }
3274
3275 /* Implementation of emit_ops method "emit_le_goto".  */
3276
3277 static void
3278 aarch64_emit_le_goto (int *offset_p, int *size_p)
3279 {
3280   uint32_t buf[16];
3281   uint32_t *p = buf;
3282
3283   p += emit_pop (p, x1);
3284   p += emit_cmp (p, x1, register_operand (x0));
3285   /* Branch over the next instruction if x0 > x1.  */
3286   p += emit_bcond (p, GT, 8);
3287   /* The NOP instruction will be patched with an unconditional branch.  */
3288   if (offset_p)
3289     *offset_p = (p - buf) * 4;
3290   if (size_p)
3291     *size_p = 4;
3292   p += emit_nop (p);
3293
3294   emit_ops_insns (buf, p - buf);
3295 }
3296
3297 /* Implementation of emit_ops method "emit_gt_goto".  */
3298
3299 static void
3300 aarch64_emit_gt_goto (int *offset_p, int *size_p)
3301 {
3302   uint32_t buf[16];
3303   uint32_t *p = buf;
3304
3305   p += emit_pop (p, x1);
3306   p += emit_cmp (p, x1, register_operand (x0));
3307   /* Branch over the next instruction if x0 <= x1.  */
3308   p += emit_bcond (p, LE, 8);
3309   /* The NOP instruction will be patched with an unconditional branch.  */
3310   if (offset_p)
3311     *offset_p = (p - buf) * 4;
3312   if (size_p)
3313     *size_p = 4;
3314   p += emit_nop (p);
3315
3316   emit_ops_insns (buf, p - buf);
3317 }
3318
3319 /* Implementation of emit_ops method "emit_ge_got".  */
3320
3321 static void
3322 aarch64_emit_ge_got (int *offset_p, int *size_p)
3323 {
3324   uint32_t buf[16];
3325   uint32_t *p = buf;
3326
3327   p += emit_pop (p, x1);
3328   p += emit_cmp (p, x1, register_operand (x0));
3329   /* Branch over the next instruction if x0 <= x1.  */
3330   p += emit_bcond (p, LT, 8);
3331   /* The NOP instruction will be patched with an unconditional branch.  */
3332   if (offset_p)
3333     *offset_p = (p - buf) * 4;
3334   if (size_p)
3335     *size_p = 4;
3336   p += emit_nop (p);
3337
3338   emit_ops_insns (buf, p - buf);
3339 }
3340
3341 static struct emit_ops aarch64_emit_ops_impl =
3342 {
3343   aarch64_emit_prologue,
3344   aarch64_emit_epilogue,
3345   aarch64_emit_add,
3346   aarch64_emit_sub,
3347   aarch64_emit_mul,
3348   aarch64_emit_lsh,
3349   aarch64_emit_rsh_signed,
3350   aarch64_emit_rsh_unsigned,
3351   aarch64_emit_ext,
3352   aarch64_emit_log_not,
3353   aarch64_emit_bit_and,
3354   aarch64_emit_bit_or,
3355   aarch64_emit_bit_xor,
3356   aarch64_emit_bit_not,
3357   aarch64_emit_equal,
3358   aarch64_emit_less_signed,
3359   aarch64_emit_less_unsigned,
3360   aarch64_emit_ref,
3361   aarch64_emit_if_goto,
3362   aarch64_emit_goto,
3363   aarch64_write_goto_address,
3364   aarch64_emit_const,
3365   aarch64_emit_call,
3366   aarch64_emit_reg,
3367   aarch64_emit_pop,
3368   aarch64_emit_stack_flush,
3369   aarch64_emit_zero_ext,
3370   aarch64_emit_swap,
3371   aarch64_emit_stack_adjust,
3372   aarch64_emit_int_call_1,
3373   aarch64_emit_void_call_2,
3374   aarch64_emit_eq_goto,
3375   aarch64_emit_ne_goto,
3376   aarch64_emit_lt_goto,
3377   aarch64_emit_le_goto,
3378   aarch64_emit_gt_goto,
3379   aarch64_emit_ge_got,
3380 };
3381
3382 /* Implementation of target ops method "emit_ops".  */
3383
3384 emit_ops *
3385 aarch64_target::emit_ops ()
3386 {
3387   return &aarch64_emit_ops_impl;
3388 }
3389
3390 /* Implementation of target ops method
3391    "get_min_fast_tracepoint_insn_len".  */
3392
3393 int
3394 aarch64_target::get_min_fast_tracepoint_insn_len ()
3395 {
3396   return 4;
3397 }
3398
3399 /* Implementation of linux target ops method "low_supports_range_stepping".  */
3400
3401 bool
3402 aarch64_target::low_supports_range_stepping ()
3403 {
3404   return true;
3405 }
3406
3407 /* Implementation of target ops method "sw_breakpoint_from_kind".  */
3408
3409 const gdb_byte *
3410 aarch64_target::sw_breakpoint_from_kind (int kind, int *size)
3411 {
3412   if (is_64bit_tdesc ())
3413     {
3414       *size = aarch64_breakpoint_len;
3415       return aarch64_breakpoint;
3416     }
3417   else
3418     return arm_sw_breakpoint_from_kind (kind, size);
3419 }
3420
3421 /* Implementation of target ops method "breakpoint_kind_from_pc".  */
3422
3423 int
3424 aarch64_target::breakpoint_kind_from_pc (CORE_ADDR *pcptr)
3425 {
3426   if (is_64bit_tdesc ())
3427     return aarch64_breakpoint_len;
3428   else
3429     return arm_breakpoint_kind_from_pc (pcptr);
3430 }
3431
3432 /* Implementation of the target ops method
3433    "breakpoint_kind_from_current_state".  */
3434
3435 int
3436 aarch64_target::breakpoint_kind_from_current_state (CORE_ADDR *pcptr)
3437 {
3438   if (is_64bit_tdesc ())
3439     return aarch64_breakpoint_len;
3440   else
3441     return arm_breakpoint_kind_from_current_state (pcptr);
3442 }
3443
3444 /* Returns true if memory tagging is supported.  */
3445 bool
3446 aarch64_target::supports_memory_tagging ()
3447 {
3448   if (current_thread == NULL)
3449     {
3450       /* We don't have any processes running, so don't attempt to
3451          use linux_get_hwcap2 as it will try to fetch the current
3452          thread id.  Instead, just fetch the auxv from the self
3453          PID.  */
3454 #ifdef HAVE_GETAUXVAL
3455       return (getauxval (AT_HWCAP2) & HWCAP2_MTE) != 0;
3456 #else
3457       return true;
3458 #endif
3459     }
3460
3461   return (linux_get_hwcap2 (current_thread->id.pid (), 8) & HWCAP2_MTE) != 0;
3462 }
3463
3464 bool
3465 aarch64_target::fetch_memtags (CORE_ADDR address, size_t len,
3466                                gdb::byte_vector &tags, int type)
3467 {
3468   /* Allocation tags are per-process, so any tid is fine.  */
3469   int tid = lwpid_of (current_thread);
3470
3471   /* Allocation tag?  */
3472   if (type == static_cast <int> (aarch64_memtag_type::mte_allocation))
3473     return aarch64_mte_fetch_memtags (tid, address, len, tags);
3474
3475   return false;
3476 }
3477
3478 bool
3479 aarch64_target::store_memtags (CORE_ADDR address, size_t len,
3480                                const gdb::byte_vector &tags, int type)
3481 {
3482   /* Allocation tags are per-process, so any tid is fine.  */
3483   int tid = lwpid_of (current_thread);
3484
3485   /* Allocation tag?  */
3486   if (type == static_cast <int> (aarch64_memtag_type::mte_allocation))
3487     return aarch64_mte_store_memtags (tid, address, len, tags);
3488
3489   return false;
3490 }
3491
3492 /* The linux target ops object.  */
3493
3494 linux_process_target *the_linux_target = &the_aarch64_target;
3495
3496 void
3497 initialize_low_arch (void)
3498 {
3499   initialize_low_arch_aarch32 ();
3500
3501   initialize_regsets_info (&aarch64_regsets_info);
3502 }