Replace write_inferior_memory with target_write_memory

[thirdparty/binutils-gdb.git] / gdb / gdbserver / linux-aarch64-low.c
diff --git a/gdb/gdbserver/linux-aarch64-low.c b/gdb/gdbserver/linux-aarch64-low.c

index 506fb9e11e7fd540723e242f1a49aa2caaca2d5b..33095ea752d5fee69e66b814dc865d8c876a5085 100644 (file)
--- a/gdb/gdbserver/linux-aarch64-low.c
+++ b/gdb/gdbserver/linux-aarch64-low.c
@@ -1,7 +1,7 @@
  /* GNU/Linux/AArch64 specific low level interface, for the remote server for
     GDB.
  
-   Copyright (C) 2009-2015 Free Software Foundation, Inc.
+   Copyright (C) 2009-2019 Free Software Foundation, Inc.
     Contributed by ARM Ltd.
  
     This file is part of GDB.
@@ -38,27 +38,16 @@
  #include <sys/uio.h>
  
  #include "gdb_proc_service.h"
-
-/* Defined in auto-generated files.  */
-void init_registers_aarch64 (void);
-extern const struct target_desc *tdesc_aarch64;
+#include "arch/aarch64.h"
+#include "linux-aarch32-tdesc.h"
+#include "linux-aarch64-tdesc.h"
+#include "nat/aarch64-sve-linux-ptrace.h"
+#include "tdesc.h"
  
  #ifdef HAVE_SYS_REG_H
  #include <sys/reg.h>
  #endif
  
-#define AARCH64_X_REGS_NUM 31
-#define AARCH64_V_REGS_NUM 32
-#define AARCH64_X0_REGNO    0
-#define AARCH64_SP_REGNO   31
-#define AARCH64_PC_REGNO   32
-#define AARCH64_CPSR_REGNO 33
-#define AARCH64_V0_REGNO   34
-#define AARCH64_FPSR_REGNO (AARCH64_V0_REGNO + AARCH64_V_REGS_NUM)
-#define AARCH64_FPCR_REGNO (AARCH64_V0_REGNO + AARCH64_V_REGS_NUM + 1)
-
-#define AARCH64_NUM_REGS (AARCH64_V0_REGNO + AARCH64_V_REGS_NUM + 2)
-
  /* Per-process arch-specific data we want to keep.  */
  
  struct arch_process_info
@@ -86,70 +75,82 @@ is_64bit_tdesc (void)
    return register_size (regcache->tdesc, 0) == 8;
  }
  
-/* Implementation of linux_target_ops method "cannot_store_register".  */
+/* Return true if the regcache contains the number of SVE registers.  */
  
-static int
-aarch64_cannot_store_register (int regno)
+static bool
+is_sve_tdesc (void)
  {
-  return regno >= AARCH64_NUM_REGS;
-}
-
-/* Implementation of linux_target_ops method "cannot_fetch_register".  */
+  struct regcache *regcache = get_thread_regcache (current_thread, 0);
  
-static int
-aarch64_cannot_fetch_register (int regno)
-{
-  return regno >= AARCH64_NUM_REGS;
+  return regcache->tdesc->reg_defs.size () == AARCH64_SVE_NUM_REGS;
  }
  
  static void
  aarch64_fill_gregset (struct regcache *regcache, void *buf)
  {
-  struct user_pt_regs *regset = buf;
+  struct user_pt_regs *regset = (struct user_pt_regs *) buf;
    int i;
  
    for (i = 0; i < AARCH64_X_REGS_NUM; i++)
-    collect_register (regcache, AARCH64_X0_REGNO + i, &regset->regs[i]);
-  collect_register (regcache, AARCH64_SP_REGNO, &regset->sp);
-  collect_register (regcache, AARCH64_PC_REGNO, &regset->pc);
-  collect_register (regcache, AARCH64_CPSR_REGNO, &regset->pstate);
+    collect_register (regcache, AARCH64_X0_REGNUM + i, &regset->regs[i]);
+  collect_register (regcache, AARCH64_SP_REGNUM, &regset->sp);
+  collect_register (regcache, AARCH64_PC_REGNUM, &regset->pc);
+  collect_register (regcache, AARCH64_CPSR_REGNUM, &regset->pstate);
  }
  
  static void
  aarch64_store_gregset (struct regcache *regcache, const void *buf)
  {
-  const struct user_pt_regs *regset = buf;
+  const struct user_pt_regs *regset = (const struct user_pt_regs *) buf;
    int i;
  
    for (i = 0; i < AARCH64_X_REGS_NUM; i++)
-    supply_register (regcache, AARCH64_X0_REGNO + i, &regset->regs[i]);
-  supply_register (regcache, AARCH64_SP_REGNO, &regset->sp);
-  supply_register (regcache, AARCH64_PC_REGNO, &regset->pc);
-  supply_register (regcache, AARCH64_CPSR_REGNO, &regset->pstate);
+    supply_register (regcache, AARCH64_X0_REGNUM + i, &regset->regs[i]);
+  supply_register (regcache, AARCH64_SP_REGNUM, &regset->sp);
+  supply_register (regcache, AARCH64_PC_REGNUM, &regset->pc);
+  supply_register (regcache, AARCH64_CPSR_REGNUM, &regset->pstate);
  }
  
  static void
  aarch64_fill_fpregset (struct regcache *regcache, void *buf)
  {
-  struct user_fpsimd_state *regset = buf;
+  struct user_fpsimd_state *regset = (struct user_fpsimd_state *) buf;
    int i;
  
    for (i = 0; i < AARCH64_V_REGS_NUM; i++)
-    collect_register (regcache, AARCH64_V0_REGNO + i, &regset->vregs[i]);
-  collect_register (regcache, AARCH64_FPSR_REGNO, &regset->fpsr);
-  collect_register (regcache, AARCH64_FPCR_REGNO, &regset->fpcr);
+    collect_register (regcache, AARCH64_V0_REGNUM + i, &regset->vregs[i]);
+  collect_register (regcache, AARCH64_FPSR_REGNUM, &regset->fpsr);
+  collect_register (regcache, AARCH64_FPCR_REGNUM, &regset->fpcr);
  }
  
  static void
  aarch64_store_fpregset (struct regcache *regcache, const void *buf)
  {
-  const struct user_fpsimd_state *regset = buf;
+  const struct user_fpsimd_state *regset
+    = (const struct user_fpsimd_state *) buf;
    int i;
  
    for (i = 0; i < AARCH64_V_REGS_NUM; i++)
-    supply_register (regcache, AARCH64_V0_REGNO + i, &regset->vregs[i]);
-  supply_register (regcache, AARCH64_FPSR_REGNO, &regset->fpsr);
-  supply_register (regcache, AARCH64_FPCR_REGNO, &regset->fpcr);
+    supply_register (regcache, AARCH64_V0_REGNUM + i, &regset->vregs[i]);
+  supply_register (regcache, AARCH64_FPSR_REGNUM, &regset->fpsr);
+  supply_register (regcache, AARCH64_FPCR_REGNUM, &regset->fpcr);
+}
+
+/* Store the pauth registers to regcache.  */
+
+static void
+aarch64_store_pauthregset (struct regcache *regcache, const void *buf)
+{
+  uint64_t *pauth_regset = (uint64_t *) buf;
+  int pauth_base = find_regno (regcache->tdesc, "pauth_dmask");
+
+  if (pauth_base == 0)
+    return;
+
+  supply_register (regcache, AARCH64_PAUTH_DMASK_REGNUM (pauth_base),
+                  &pauth_regset[0]);
+  supply_register (regcache, AARCH64_PAUTH_CMASK_REGNUM (pauth_base),
+                  &pauth_regset[1]);
  }
  
  /* Enable miscellaneous debugging output.  The name is historical - it
@@ -162,23 +163,9 @@ static CORE_ADDR
  aarch64_get_pc (struct regcache *regcache)
  {
    if (register_size (regcache->tdesc, 0) == 8)
-    {
-      unsigned long pc;
-
-      collect_register_by_name (regcache, "pc", &pc);
-      if (debug_threads)
-       debug_printf ("stop pc is %08lx\n", pc);
-      return pc;
-    }
+    return linux_get_pc_64bit (regcache);
    else
-    {
-      unsigned int pc;
-
-      collect_register_by_name (regcache, "pc", &pc);
-      if (debug_threads)
-       debug_printf ("stop pc is %04x\n", pc);
-      return pc;
-    }
+    return linux_get_pc_32bit (regcache);
  }
  
  /* Implementation of linux_target_ops method "set_pc".  */
@@ -187,15 +174,9 @@ static void
  aarch64_set_pc (struct regcache *regcache, CORE_ADDR pc)
  {
    if (register_size (regcache->tdesc, 0) == 8)
-    {
-      unsigned long newpc = pc;
-      supply_register_by_name (regcache, "pc", &newpc);
-    }
+    linux_set_pc_64bit (regcache, pc);
    else
-    {
-      unsigned int newpc = pc;
-      supply_register_by_name (regcache, "pc", &newpc);
-    }
+    linux_set_pc_32bit (regcache, pc);
  }
  
  #define aarch64_breakpoint_len 4
@@ -210,14 +191,19 @@ static const gdb_byte aarch64_breakpoint[] = {0x00, 0x00, 0x20, 0xd4};
  static int
  aarch64_breakpoint_at (CORE_ADDR where)
  {
-  gdb_byte insn[aarch64_breakpoint_len];
+  if (is_64bit_tdesc ())
+    {
+      gdb_byte insn[aarch64_breakpoint_len];
  
-  (*the_target->read_memory) (where, (unsigned char *) &insn,
-                             aarch64_breakpoint_len);
-  if (memcmp (insn, aarch64_breakpoint, aarch64_breakpoint_len) == 0)
-    return 1;
+      (*the_target->read_memory) (where, (unsigned char *) &insn,
+                                 aarch64_breakpoint_len);
+      if (memcmp (insn, aarch64_breakpoint, aarch64_breakpoint_len) == 0)
+       return 1;
  
-  return 0;
+      return 0;
+    }
+  else
+    return arm_breakpoint_at (where);
  }
  
  static void
@@ -259,22 +245,6 @@ aarch64_supports_z_point_type (char z_type)
    switch (z_type)
      {
      case Z_PACKET_SW_BP:
-      {
-       if (!extended_protocol && is_64bit_tdesc ())
-         {
-           /* Only enable Z0 packet in non-multi-arch debugging.  If
-              extended protocol is used, don't enable Z0 packet because
-              GDBserver may attach to 32-bit process.  */
-           return 1;
-         }
-       else
-         {
-           /* Disable Z0 packet so that GDBserver doesn't have to handle
-              different breakpoint instructions (aarch64, arm, thumb etc)
-              in multi-arch debugging.  */
-           return 0;
-         }
-      }
      case Z_PACKET_HW_BP:
      case Z_PACKET_WRITE_WP:
      case Z_PACKET_READ_WP:
@@ -315,9 +285,17 @@ aarch64_insert_point (enum raw_bkpt_type type, CORE_ADDR addr,
         ret = -1;
      }
    else
-    ret =
-      aarch64_handle_breakpoint (targ_type, addr, len, 1 /* is_insert */,
-                                state);
+    {
+      if (len == 3)
+       {
+         /* LEN is 3 means the breakpoint is set on a 32-bit thumb
+            instruction.   Set it to 2 to correctly encode length bit
+            mask in hardware/watchpoint control register.  */
+         len = 2;
+       }
+      ret = aarch64_handle_breakpoint (targ_type, addr, len,
+                                      1 /* is_insert */, state);
+    }
  
    if (show_debug_regs)
      aarch64_show_debug_reg_state (state, "insert_point", addr, len,
@@ -353,9 +331,17 @@ aarch64_remove_point (enum raw_bkpt_type type, CORE_ADDR addr,
        aarch64_handle_watchpoint (targ_type, addr, len, 0 /* is_insert */,
                                  state);
    else
-    ret =
-      aarch64_handle_breakpoint (targ_type, addr, len, 0 /* is_insert */,
-                                state);
+    {
+      if (len == 3)
+       {
+         /* LEN is 3 means the breakpoint is set on a 32-bit thumb
+            instruction.   Set it to 2 to correctly encode length bit
+            mask in hardware/watchpoint control register.  */
+         len = 2;
+       }
+      ret = aarch64_handle_breakpoint (targ_type, addr, len,
+                                      0 /* is_insert */,  state);
+    }
  
    if (show_debug_regs)
      aarch64_show_debug_reg_state (state, "remove_point", addr, len,
@@ -388,14 +374,39 @@ aarch64_stopped_data_address (void)
    state = aarch64_get_debug_reg_state (pid_of (current_thread));
    for (i = aarch64_num_wp_regs - 1; i >= 0; --i)
      {
+      const unsigned int offset
+       = aarch64_watchpoint_offset (state->dr_ctrl_wp[i]);
        const unsigned int len = aarch64_watchpoint_length (state->dr_ctrl_wp[i]);
        const CORE_ADDR addr_trap = (CORE_ADDR) siginfo.si_addr;
-      const CORE_ADDR addr_watch = state->dr_addr_wp[i];
+      const CORE_ADDR addr_watch = state->dr_addr_wp[i] + offset;
+      const CORE_ADDR addr_watch_aligned = align_down (state->dr_addr_wp[i], 8);
+      const CORE_ADDR addr_orig = state->dr_addr_orig_wp[i];
+
        if (state->dr_ref_count_wp[i]
           && DR_CONTROL_ENABLED (state->dr_ctrl_wp[i])
-         && addr_trap >= addr_watch
+         && addr_trap >= addr_watch_aligned
           && addr_trap < addr_watch + len)
-       return addr_trap;
+       {
+         /* ADDR_TRAP reports the first address of the memory range
+            accessed by the CPU, regardless of what was the memory
+            range watched.  Thus, a large CPU access that straddles
+            the ADDR_WATCH..ADDR_WATCH+LEN range may result in an
+            ADDR_TRAP that is lower than the
+            ADDR_WATCH..ADDR_WATCH+LEN range.  E.g.:
+
+            addr: |   4   |   5   |   6   |   7   |   8   |
+                                  |---- range watched ----|
+                  |----------- range accessed ------------|
+
+            In this case, ADDR_TRAP will be 4.
+
+            To match a watchpoint known to GDB core, we must never
+            report *ADDR_P outside of any ADDR_WATCH..ADDR_WATCH+LEN
+            range.  ADDR_WATCH <= ADDR_TRAP < ADDR_ORIG is a false
+            positive on kernels older than 4.10.  See PR
+            external/20207.  */
+         return addr_orig;
+       }
      }
  
    return (CORE_ADDR) 0;
@@ -415,7 +426,7 @@ aarch64_stopped_by_watchpoint (void)
  /* Fetch the thread-local storage pointer for libthread_db.  */
  
  ps_err_e
-ps_get_thread_area (const struct ps_prochandle *ph,
+ps_get_thread_area (struct ps_prochandle *ph,
                     lwpid_t lwpid, int idx, void **base)
  {
    return aarch64_ps_get_thread_area (ph, lwpid, idx, base,
@@ -425,7 +436,7 @@ ps_get_thread_area (const struct ps_prochandle *ph,
  /* Implementation of linux_target_ops method "siginfo_fixup".  */
  
  static int
-aarch64_linux_siginfo_fixup (siginfo_t *native, void *inf, int direction)
+aarch64_linux_siginfo_fixup (siginfo_t *native, gdb_byte *inf, int direction)
  {
    /* Is the inferior 32-bit?  If so, then fixup the siginfo object.  */
    if (!is_64bit_tdesc ())
@@ -443,7 +454,7 @@ aarch64_linux_siginfo_fixup (siginfo_t *native, void *inf, int direction)
    return 0;
  }
  
-/* Implementation of linux_target_ops method "linux_new_process".  */
+/* Implementation of linux_target_ops method "new_process".  */
  
  static struct arch_process_info *
  aarch64_linux_new_process (void)
@@ -455,6 +466,14 @@ aarch64_linux_new_process (void)
    return info;
  }
  
+/* Implementation of linux_target_ops method "delete_process".  */
+
+static void
+aarch64_linux_delete_process (struct arch_process_info *info)
+{
+  xfree (info);
+}
+
  /* Implementation of linux_target_ops method "linux_new_fork".  */
  
  static void
@@ -484,11 +503,13 @@ aarch64_linux_new_fork (struct process_info *parent,
    *child->priv->arch_private = *parent->priv->arch_private;
  }
  
-/* Return the right target description according to the ELF file of
-   current thread.  */
+/* Matches HWCAP_PACA in kernel header arch/arm64/include/uapi/asm/hwcap.h.  */
+#define AARCH64_HWCAP_PACA (1 << 30)
+
+/* Implementation of linux_target_ops method "arch_setup".  */
  
-static const struct target_desc *
-aarch64_linux_read_description (void)
+static void
+aarch64_arch_setup (void)
  {
    unsigned int machine;
    int is_elf64;
@@ -499,19 +520,33 @@ aarch64_linux_read_description (void)
    is_elf64 = linux_pid_exe_is_elf_64_file (tid, &machine);
  
    if (is_elf64)
-    return tdesc_aarch64;
+    {
+      uint64_t vq = aarch64_sve_get_vq (tid);
+      unsigned long hwcap = linux_get_hwcap (8);
+      bool pauth_p = hwcap & AARCH64_HWCAP_PACA;
+
+      current_process ()->tdesc = aarch64_linux_read_description (vq, pauth_p);
+    }
    else
-    return tdesc_arm_with_neon;
+    current_process ()->tdesc = aarch32_linux_read_description ();
+
+  aarch64_linux_get_debug_reg_capacity (lwpid_of (current_thread));
  }
  
-/* Implementation of linux_target_ops method "arch_setup".  */
+/* Wrapper for aarch64_sve_regs_copy_to_reg_buf.  */
  
  static void
-aarch64_arch_setup (void)
+aarch64_sve_regs_copy_to_regcache (struct regcache *regcache, const void *buf)
  {
-  current_process ()->tdesc = aarch64_linux_read_description ();
+  return aarch64_sve_regs_copy_to_reg_buf (regcache, buf);
+}
  
-  aarch64_linux_get_debug_reg_capacity (lwpid_of (current_thread));
+/* Wrapper for aarch64_sve_regs_copy_from_reg_buf.  */
+
+static void
+aarch64_sve_regs_copy_from_regcache (struct regcache *regcache, void *buf)
+{
+  return aarch64_sve_regs_copy_from_reg_buf (regcache, buf);
  }
  
  static struct regset_info aarch64_regsets[] =
@@ -523,7 +558,10 @@ static struct regset_info aarch64_regsets[] =
      sizeof (struct user_fpsimd_state), FP_REGS,
      aarch64_fill_fpregset, aarch64_store_fpregset
    },
-  { 0, 0, 0, -1, -1, NULL, NULL }
+  { PTRACE_GETREGSET, PTRACE_SETREGSET, NT_ARM_PAC_MASK,
+    AARCH64_PAUTH_REGS_SIZE, OPTIONAL_REGS,
+    NULL, aarch64_store_pauthregset },
+  NULL_REGSET
  };
  
  static struct regsets_info aarch64_regsets_info =
@@ -540,15 +578,47 @@ static struct regs_info regs_info_aarch64 =
      &aarch64_regsets_info,
    };
  
+static struct regset_info aarch64_sve_regsets[] =
+{
+  { PTRACE_GETREGSET, PTRACE_SETREGSET, NT_PRSTATUS,
+    sizeof (struct user_pt_regs), GENERAL_REGS,
+    aarch64_fill_gregset, aarch64_store_gregset },
+  { PTRACE_GETREGSET, PTRACE_SETREGSET, NT_ARM_SVE,
+    SVE_PT_SIZE (AARCH64_MAX_SVE_VQ, SVE_PT_REGS_SVE), EXTENDED_REGS,
+    aarch64_sve_regs_copy_from_regcache, aarch64_sve_regs_copy_to_regcache
+  },
+  { PTRACE_GETREGSET, PTRACE_SETREGSET, NT_ARM_PAC_MASK,
+    AARCH64_PAUTH_REGS_SIZE, OPTIONAL_REGS,
+    NULL, aarch64_store_pauthregset },
+  NULL_REGSET
+};
+
+static struct regsets_info aarch64_sve_regsets_info =
+  {
+    aarch64_sve_regsets, /* regsets.  */
+    0, /* num_regsets.  */
+    NULL, /* disabled_regsets.  */
+  };
+
+static struct regs_info regs_info_aarch64_sve =
+  {
+    NULL, /* regset_bitmap.  */
+    NULL, /* usrregs.  */
+    &aarch64_sve_regsets_info,
+  };
+
  /* Implementation of linux_target_ops method "regs_info".  */
  
  static const struct regs_info *
  aarch64_regs_info (void)
  {
-  if (is_64bit_tdesc ())
-    return &regs_info_aarch64;
-  else
+  if (!is_64bit_tdesc ())
      return &regs_info_aarch32;
+
+  if (is_sve_tdesc ())
+    return &regs_info_aarch64_sve;
+
+  return &regs_info_aarch64;
  }
  
  /* Implementation of linux_target_ops method "supports_tracepoints".  */
@@ -584,156 +654,24 @@ aarch64_get_thread_area (int lwpid, CORE_ADDR *addrp)
    return 0;
  }
  
-/* Extract a signed value from a bit field within an instruction
-   encoding.
-
-   INSN is the instruction opcode.
-
-   WIDTH specifies the width of the bit field to extract (in bits).
+/* Implementation of linux_target_ops method "get_syscall_trapinfo".  */
  
-   OFFSET specifies the least significant bit of the field where bits
-   are numbered zero counting from least to most significant.  */
-
-static int32_t
-extract_signed_bitfield (uint32_t insn, unsigned width, unsigned offset)
+static void
+aarch64_get_syscall_trapinfo (struct regcache *regcache, int *sysno)
  {
-  unsigned shift_l = sizeof (int32_t) * 8 - (offset + width);
-  unsigned shift_r = sizeof (int32_t) * 8 - width;
-
-  return ((int32_t) insn << shift_l) >> shift_r;
-}
-
-/* Decode an opcode if it represents an LDR or LDRSW instruction taking a
-   literal offset from the current PC.
-
-   ADDR specifies the address of the opcode.
-   INSN specifies the opcode to test.
-   IS_W is set if the instruction is LDRSW.
-   IS64 receives size field from the decoded instruction.
-   RT receives the 'rt' field from the decoded instruction.
-   OFFSET receives the 'imm' field from the decoded instruction.
-
-   Return 1 if the opcodes matches and is decoded, otherwise 0.  */
+  int use_64bit = register_size (regcache->tdesc, 0) == 8;
  
-int
-aarch64_decode_ldr_literal (CORE_ADDR addr, uint32_t insn, int *is_w,
-                           int *is64, unsigned *rt, int32_t *offset)
-{
-  /* LDR    0T01 1000 iiii iiii iiii iiii iiir rrrr */
-  /* LDRSW  1001 1000 iiii iiii iiii iiii iiir rrrr */
-  if ((insn & 0x3f000000) == 0x18000000)
+  if (use_64bit)
      {
-      *is_w = (insn >> 31) & 0x1;
-
-      if (*is_w)
-       {
-         /* LDRSW always takes a 64-bit destination registers.  */
-         *is64 = 1;
-       }
-      else
-       *is64 = (insn >> 30) & 0x1;
+      long l_sysno;
  
-      *rt = (insn >> 0) & 0x1f;
-      *offset = extract_signed_bitfield (insn, 19, 5) << 2;
-
-      if (aarch64_debug)
-       debug_printf ("decode: %s 0x%x %s %s%u, #?\n",
-                     core_addr_to_string_nz (addr), insn,
-                     *is_w ? "ldrsw" : "ldr",
-                     *is64 ? "x" : "w", *rt);
-
-      return 1;
+      collect_register_by_name (regcache, "x8", &l_sysno);
+      *sysno = (int) l_sysno;
      }
-
-  return 0;
+  else
+    collect_register_by_name (regcache, "r7", sysno);
  }
  
-/* List of opcodes that we need for building the jump pad and relocating
-   an instruction.  */
-
-enum aarch64_opcodes
-{
-  /* B              0001 01ii iiii iiii iiii iiii iiii iiii */
-  /* BL             1001 01ii iiii iiii iiii iiii iiii iiii */
-  /* B.COND         0101 0100 iiii iiii iiii iiii iii0 cccc */
-  /* CBZ            s011 0100 iiii iiii iiii iiii iiir rrrr */
-  /* CBNZ           s011 0101 iiii iiii iiii iiii iiir rrrr */
-  /* TBZ            b011 0110 bbbb biii iiii iiii iiir rrrr */
-  /* TBNZ           b011 0111 bbbb biii iiii iiii iiir rrrr */
-  B               = 0x14000000,
-  BL              = 0x80000000 | B,
-  BCOND           = 0x40000000 | B,
-  CBZ             = 0x20000000 | B,
-  CBNZ            = 0x21000000 | B,
-  TBZ             = 0x36000000 | B,
-  TBNZ            = 0x37000000 | B,
-  /* BLR            1101 0110 0011 1111 0000 00rr rrr0 0000 */
-  BLR             = 0xd63f0000,
-  /* RET            1101 0110 0101 1111 0000 00rr rrr0 0000 */
-  RET             = 0xd65f0000,
-  /* STP            s010 100o o0ii iiii irrr rrrr rrrr rrrr */
-  /* LDP            s010 100o o1ii iiii irrr rrrr rrrr rrrr */
-  /* STP (SIMD&VFP) ss10 110o o0ii iiii irrr rrrr rrrr rrrr */
-  /* LDP (SIMD&VFP) ss10 110o o1ii iiii irrr rrrr rrrr rrrr */
-  STP             = 0x28000000,
-  LDP             = 0x28400000,
-  STP_SIMD_VFP    = 0x04000000 | STP,
-  LDP_SIMD_VFP    = 0x04000000 | LDP,
-  /* STR            ss11 100o 00xi iiii iiii xxrr rrrr rrrr */
-  /* LDR            ss11 100o 01xi iiii iiii xxrr rrrr rrrr */
-  /* LDRSW          1011 100o 10xi iiii iiii xxrr rrrr rrrr */
-  STR             = 0x38000000,
-  LDR             = 0x00400000 | STR,
-  LDRSW           = 0x80800000 | STR,
-  /* LDAXR          ss00 1000 0101 1111 1111 11rr rrrr rrrr */
-  LDAXR           = 0x085ffc00,
-  /* STXR           ss00 1000 000r rrrr 0111 11rr rrrr rrrr */
-  STXR            = 0x08007c00,
-  /* STLR           ss00 1000 1001 1111 1111 11rr rrrr rrrr */
-  STLR            = 0x089ffc00,
-  /* MOV            s101 0010 1xxi iiii iiii iiii iiir rrrr */
-  /* MOVK           s111 0010 1xxi iiii iiii iiii iiir rrrr */
-  MOV             = 0x52800000,
-  MOVK            = 0x20000000 | MOV,
-  /* ADD            s00o ooo1 xxxx xxxx xxxx xxxx xxxx xxxx */
-  /* SUB            s10o ooo1 xxxx xxxx xxxx xxxx xxxx xxxx */
-  /* SUBS           s11o ooo1 xxxx xxxx xxxx xxxx xxxx xxxx */
-  ADD             = 0x01000000,
-  SUB             = 0x40000000 | ADD,
-  SUBS            = 0x20000000 | SUB,
-  /* AND            s000 1010 xx0x xxxx xxxx xxxx xxxx xxxx */
-  /* ORR            s010 1010 xx0x xxxx xxxx xxxx xxxx xxxx */
-  /* ORN            s010 1010 xx1x xxxx xxxx xxxx xxxx xxxx */
-  /* EOR            s100 1010 xx0x xxxx xxxx xxxx xxxx xxxx */
-  AND             = 0x0a000000,
-  ORR             = 0x20000000 | AND,
-  ORN             = 0x00200000 | ORR,
-  EOR             = 0x40000000 | AND,
-  /* LSLV           s001 1010 110r rrrr 0010 00rr rrrr rrrr */
-  /* LSRV           s001 1010 110r rrrr 0010 01rr rrrr rrrr */
-  /* ASRV           s001 1010 110r rrrr 0010 10rr rrrr rrrr */
-  LSLV             = 0x1ac02000,
-  LSRV             = 0x00000400 | LSLV,
-  ASRV             = 0x00000800 | LSLV,
-  /* SBFM           s001 0011 0nii iiii iiii iirr rrrr rrrr */
-  SBFM            = 0x13000000,
-  /* UBFM           s101 0011 0nii iiii iiii iirr rrrr rrrr */
-  UBFM            = 0x40000000 | SBFM,
-  /* CSINC          s001 1010 100r rrrr cccc 01rr rrrr rrrr */
-  CSINC           = 0x9a800400,
-  /* MUL            s001 1011 000r rrrr 0111 11rr rrrr rrrr */
-  MUL             = 0x1b007c00,
-  /* MSR (register) 1101 0101 0001 oooo oooo oooo ooor rrrr */
-  /* MRS            1101 0101 0011 oooo oooo oooo ooor rrrr */
-  MSR             = 0xd5100000,
-  MRS             = 0x00200000 | MSR,
-  /* HINT           1101 0101 0000 0011 0010 oooo ooo1 1111 */
-  HINT            = 0xd503201f,
-  SEVL            = (5 << 5) | HINT,
-  WFE             = (2 << 5) | HINT,
-  NOP             = (0 << 5) | HINT,
-};
-
  /* List of condition codes that we need.  */
  
  enum aarch64_condition_codes
@@ -747,14 +685,10 @@ enum aarch64_condition_codes
    LE = 0xd,
  };
  
-/* Representation of a general purpose register of the form xN or wN.
-
-   This type is used by emitting functions that take registers as operands.  */
-
-struct aarch64_register
+enum aarch64_operand_type
  {
-  unsigned num;
-  int is64;
+  OPERAND_IMMEDIATE,
+  OPERAND_REGISTER,
  };
  
  /* Representation of an operand.  At this time, it only supports register
@@ -763,11 +697,8 @@ struct aarch64_register
  struct aarch64_operand
  {
    /* Type of the operand.  */
-  enum
-    {
-      OPERAND_IMMEDIATE,
-      OPERAND_REGISTER,
-    } type;
+  enum aarch64_operand_type type;
+
    /* Value of the operand according to the type.  */
    union
      {
@@ -843,28 +774,6 @@ immediate_operand (uint32_t imm)
    return operand;
  }
  
-/* Representation of a memory operand, used for load and store
-   instructions.
-
-   The types correspond to the following variants:
-
-   MEMORY_OPERAND_OFFSET:    LDR rt, [rn, #offset]
-   MEMORY_OPERAND_PREINDEX:  LDR rt, [rn, #index]!
-   MEMORY_OPERAND_POSTINDEX: LDR rt, [rn], #index  */
-
-struct aarch64_memory_operand
-{
-  /* Type of the operand.  */
-  enum
-    {
-      MEMORY_OPERAND_OFFSET,
-      MEMORY_OPERAND_PREINDEX,
-      MEMORY_OPERAND_POSTINDEX,
-    } type;
-  /* Index from the base register.  */
-  int32_t index;
-};
-
  /* Helper function to create an offset memory operand.
  
     For example:
@@ -916,108 +825,6 @@ enum aarch64_system_control_registers
    TPIDR_EL0 = (0x1 << 14) | (0x3 << 11) | (0xd << 7) | (0x0 << 3) | 0x2
  };
  
-/* Helper macro to mask and shift a value into a bitfield.  */
-
-#define ENCODE(val, size, offset) \
-  ((uint32_t) ((val & ((1ULL << size) - 1)) << offset))
-
-/* Write a 32-bit unsigned integer INSN info *BUF.  Return the number of
-   instructions written (aka. 1).  */
-
-static int
-emit_insn (uint32_t *buf, uint32_t insn)
-{
-  *buf = insn;
-  return 1;
-}
-
-/* Write a B or BL instruction into *BUF.
-
-     B  #offset
-     BL #offset
-
-   IS_BL specifies if the link register should be updated.
-   OFFSET is the immediate offset from the current PC.  It is
-   byte-addressed but should be 4 bytes aligned.  It has a limited range of
-   +/- 128MB (26 bits << 2).  */
-
-static int
-emit_b (uint32_t *buf, int is_bl, int32_t offset)
-{
-  uint32_t imm26 = ENCODE (offset >> 2, 26, 0);
-
-  if (is_bl)
-    return emit_insn (buf, BL | imm26);
-  else
-    return emit_insn (buf, B | imm26);
-}
-
-/* Write a BCOND instruction into *BUF.
-
-     B.COND #offset
-
-   COND specifies the condition field.
-   OFFSET is the immediate offset from the current PC.  It is
-   byte-addressed but should be 4 bytes aligned.  It has a limited range of
-   +/- 1MB (19 bits << 2).  */
-
-static int
-emit_bcond (uint32_t *buf, unsigned cond, int32_t offset)
-{
-  return emit_insn (buf, BCOND | ENCODE (offset >> 2, 19, 5)
-                   | ENCODE (cond, 4, 0));
-}
-
-/* Write a CBZ or CBNZ instruction into *BUF.
-
-     CBZ  rt, #offset
-     CBNZ rt, #offset
-
-   IS_CBNZ distinguishes between CBZ and CBNZ instructions.
-   RN is the register to test.
-   OFFSET is the immediate offset from the current PC.  It is
-   byte-addressed but should be 4 bytes aligned.  It has a limited range of
-   +/- 1MB (19 bits << 2).  */
-
-static int
-emit_cb (uint32_t *buf, int is_cbnz, struct aarch64_register rt,
-        int32_t offset)
-{
-  uint32_t imm19 = ENCODE (offset >> 2, 19, 5);
-  uint32_t sf = ENCODE (rt.is64, 1, 31);
-
-  if (is_cbnz)
-    return emit_insn (buf, CBNZ | sf | imm19 | ENCODE (rt.num, 5, 0));
-  else
-    return emit_insn (buf, CBZ | sf | imm19 | ENCODE (rt.num, 5, 0));
-}
-
-/* Write a TBZ or TBNZ instruction into *BUF.
-
-     TBZ  rt, #bit, #offset
-     TBNZ rt, #bit, #offset
-
-   IS_TBNZ distinguishes between TBZ and TBNZ instructions.
-   RT is the register to test.
-   BIT is the index of the bit to test in register RT.
-   OFFSET is the immediate offset from the current PC.  It is
-   byte-addressed but should be 4 bytes aligned.  It has a limited range of
-   +/- 32KB (14 bits << 2).  */
-
-static int
-emit_tb (uint32_t *buf, int is_tbnz, unsigned bit,
-        struct aarch64_register rt, int32_t offset)
-{
-  uint32_t imm14 = ENCODE (offset >> 2, 14, 5);
-  uint32_t b40 = ENCODE (bit, 5, 19);
-  uint32_t b5 = ENCODE (bit >> 5, 1, 31);
-
-  if (is_tbnz)
-    return emit_insn (buf, TBNZ | b5 | b40 | imm14 | ENCODE (rt.num, 5, 0));
-  else
-    return emit_insn (buf, TBZ | b5 | b40 | imm14 | ENCODE (rt.num, 5, 0));
-}
-
  /* Write a BLR instruction into *BUF.
  
       BLR rn
@@ -1027,7 +834,7 @@ emit_tb (uint32_t *buf, int is_tbnz, unsigned bit,
  static int
  emit_blr (uint32_t *buf, struct aarch64_register rn)
  {
-  return emit_insn (buf, BLR | ENCODE (rn.num, 5, 5));
+  return aarch64_emit_insn (buf, BLR | ENCODE (rn.num, 5, 5));
  }
  
  /* Write a RET instruction into *BUF.
@@ -1039,7 +846,7 @@ emit_blr (uint32_t *buf, struct aarch64_register rn)
  static int
  emit_ret (uint32_t *buf, struct aarch64_register rn)
  {
-  return emit_insn (buf, RET | ENCODE (rn.num, 5, 5));
+  return aarch64_emit_insn (buf, RET | ENCODE (rn.num, 5, 5));
  }
  
  static int
@@ -1082,10 +889,10 @@ emit_load_store_pair (uint32_t *buf, enum aarch64_opcodes opcode,
        return 0;
      }
  
-  return emit_insn (buf, opcode | opc | pre_index | write_back
-                   | ENCODE (operand.index >> 3, 7, 15)
-                   | ENCODE (rt2.num, 5, 10)
-                   | ENCODE (rn.num, 5, 5) | ENCODE (rt.num, 5, 0));
+  return aarch64_emit_insn (buf, opcode | opc | pre_index | write_back
+                           | ENCODE (operand.index >> 3, 7, 15)
+                           | ENCODE (rt2.num, 5, 10)
+                           | ENCODE (rn.num, 5, 5) | ENCODE (rt.num, 5, 0));
  }
  
  /* Write a STP instruction into *BUF.
@@ -1142,9 +949,10 @@ emit_ldp_q_offset (uint32_t *buf, unsigned rt, unsigned rt2,
    uint32_t opc = ENCODE (2, 2, 30);
    uint32_t pre_index = ENCODE (1, 1, 24);
  
-  return emit_insn (buf, LDP_SIMD_VFP | opc | pre_index
-                   | ENCODE (offset >> 4, 7, 15) | ENCODE (rt2, 5, 10)
-                   | ENCODE (rn.num, 5, 5) | ENCODE (rt, 5, 0));
+  return aarch64_emit_insn (buf, LDP_SIMD_VFP | opc | pre_index
+                           | ENCODE (offset >> 4, 7, 15)
+                           | ENCODE (rt2, 5, 10)
+                           | ENCODE (rn.num, 5, 5) | ENCODE (rt, 5, 0));
  }
  
  /* Write a STP (SIMD&VFP) instruction using Q registers into *BUF.
@@ -1163,71 +971,10 @@ emit_stp_q_offset (uint32_t *buf, unsigned rt, unsigned rt2,
    uint32_t opc = ENCODE (2, 2, 30);
    uint32_t pre_index = ENCODE (1, 1, 24);
  
-  return emit_insn (buf, STP_SIMD_VFP | opc | pre_index
-                   | ENCODE (offset >> 4, 7, 15) | ENCODE (rt2, 5, 10)
-                   | ENCODE (rn.num, 5, 5) | ENCODE (rt, 5, 0));
-}
-
-/* Helper function emitting a load or store instruction.  */
-
-static int
-emit_load_store (uint32_t *buf, uint32_t size, enum aarch64_opcodes opcode,
-                struct aarch64_register rt, struct aarch64_register rn,
-                struct aarch64_memory_operand operand)
-{
-  uint32_t op;
-
-  switch (operand.type)
-    {
-    case MEMORY_OPERAND_OFFSET:
-      {
-       op = ENCODE (1, 1, 24);
-
-       return emit_insn (buf, opcode | ENCODE (size, 2, 30) | op
-                         | ENCODE (operand.index >> 3, 12, 10)
-                         | ENCODE (rn.num, 5, 5) | ENCODE (rt.num, 5, 0));
-      }
-    case MEMORY_OPERAND_POSTINDEX:
-      {
-       uint32_t post_index = ENCODE (1, 2, 10);
-
-       op = ENCODE (0, 1, 24);
-
-       return emit_insn (buf, opcode | ENCODE (size, 2, 30) | op
-                         | post_index | ENCODE (operand.index, 9, 12)
-                         | ENCODE (rn.num, 5, 5) | ENCODE (rt.num, 5, 0));
-      }
-    case MEMORY_OPERAND_PREINDEX:
-      {
-       uint32_t pre_index = ENCODE (3, 2, 10);
-
-       op = ENCODE (0, 1, 24);
-
-       return emit_insn (buf, opcode | ENCODE (size, 2, 30) | op
-                         | pre_index | ENCODE (operand.index, 9, 12)
-                         | ENCODE (rn.num, 5, 5) | ENCODE (rt.num, 5, 0));
-      }
-    default:
-      return 0;
-    }
-}
-
-/* Write a LDR instruction into *BUF.
-
-     LDR rt, [rn, #offset]
-     LDR rt, [rn, #index]!
-     LDR rt, [rn], #index
-
-   RT is the register to store.
-   RN is the base address register.
-   OFFSET is the immediate to add to the base address.  It is limited to
-   0 .. 32760 range (12 bits << 3).  */
-
-static int
-emit_ldr (uint32_t *buf, struct aarch64_register rt,
-         struct aarch64_register rn, struct aarch64_memory_operand operand)
-{
-  return emit_load_store (buf, rt.is64 ? 3 : 2, LDR, rt, rn, operand);
+  return aarch64_emit_insn (buf, STP_SIMD_VFP | opc | pre_index
+                           | ENCODE (offset >> 4, 7, 15)
+                           | ENCODE (rt2, 5, 10)
+                           | ENCODE (rn.num, 5, 5) | ENCODE (rt, 5, 0));
  }
  
  /* Write a LDRH instruction into *BUF.
@@ -1246,7 +993,7 @@ emit_ldrh (uint32_t *buf, struct aarch64_register rt,
            struct aarch64_register rn,
            struct aarch64_memory_operand operand)
  {
-  return emit_load_store (buf, 1, LDR, rt, rn, operand);
+  return aarch64_emit_load_store (buf, 1, LDR, rt, rn, operand);
  }
  
  /* Write a LDRB instruction into *BUF.
@@ -1265,27 +1012,10 @@ emit_ldrb (uint32_t *buf, struct aarch64_register rt,
            struct aarch64_register rn,
            struct aarch64_memory_operand operand)
  {
-  return emit_load_store (buf, 0, LDR, rt, rn, operand);
+  return aarch64_emit_load_store (buf, 0, LDR, rt, rn, operand);
  }
  
-/* Write a LDRSW instruction into *BUF.  The register size is 64-bit.
-
-     LDRSW xt, [rn, #offset]
-     LDRSW xt, [rn, #index]!
-     LDRSW xt, [rn], #index
-
-   RT is the register to store.
-   RN is the base address register.
-   OFFSET is the immediate to add to the base address.  It is limited to
-   0 .. 16380 range (12 bits << 2).  */
  
-static int
-emit_ldrsw (uint32_t *buf, struct aarch64_register rt,
-                  struct aarch64_register rn,
-                  struct aarch64_memory_operand operand)
-{
-  return emit_load_store (buf, 3, LDRSW, rt, rn, operand);
-}
  
  /* Write a STR instruction into *BUF.
  
@@ -1303,7 +1033,7 @@ emit_str (uint32_t *buf, struct aarch64_register rt,
           struct aarch64_register rn,
           struct aarch64_memory_operand operand)
  {
-  return emit_load_store (buf, rt.is64 ? 3 : 2, STR, rt, rn, operand);
+  return aarch64_emit_load_store (buf, rt.is64 ? 3 : 2, STR, rt, rn, operand);
  }
  
  /* Helper function emitting an exclusive load or store instruction.  */
@@ -1316,9 +1046,9 @@ emit_load_store_exclusive (uint32_t *buf, uint32_t size,
                            struct aarch64_register rt2,
                            struct aarch64_register rn)
  {
-  return emit_insn (buf, opcode | ENCODE (size, 2, 30)
-                   | ENCODE (rs.num, 5, 16) | ENCODE (rt2.num, 5, 10)
-                   | ENCODE (rn.num, 5, 5) | ENCODE (rt.num, 5, 0));
+  return aarch64_emit_insn (buf, opcode | ENCODE (size, 2, 30)
+                           | ENCODE (rs.num, 5, 16) | ENCODE (rt2.num, 5, 10)
+                           | ENCODE (rn.num, 5, 5) | ENCODE (rt.num, 5, 0));
  }
  
  /* Write a LAXR instruction into *BUF.
@@ -1370,15 +1100,15 @@ emit_stlr (uint32_t *buf, struct aarch64_register rt,
  /* Helper function for data processing instructions with register sources.  */
  
  static int
-emit_data_processing_reg (uint32_t *buf, enum aarch64_opcodes opcode,
+emit_data_processing_reg (uint32_t *buf, uint32_t opcode,
                           struct aarch64_register rd,
                           struct aarch64_register rn,
                           struct aarch64_register rm)
  {
    uint32_t size = ENCODE (rd.is64, 1, 31);
  
-  return emit_insn (buf, opcode | size | ENCODE (rm.num, 5, 16)
-                   | ENCODE (rn.num, 5, 5) | ENCODE (rd.num, 5, 0));
+  return aarch64_emit_insn (buf, opcode | size | ENCODE (rm.num, 5, 16)
+                           | ENCODE (rn.num, 5, 5) | ENCODE (rd.num, 5, 0));
  }
  
  /* Helper function for data processing instructions taking either a register
@@ -1399,9 +1129,10 @@ emit_data_processing (uint32_t *buf, enum aarch64_opcodes opcode,
        /* xxx1 000x xxxx xxxx xxxx xxxx xxxx xxxx */
        operand_opcode = ENCODE (8, 4, 25);
  
-      return emit_insn (buf, opcode | operand_opcode | size
-                       | ENCODE (operand.imm, 12, 10)
-                       | ENCODE (rn.num, 5, 5) | ENCODE (rd.num, 5, 0));
+      return aarch64_emit_insn (buf, opcode | operand_opcode | size
+                               | ENCODE (operand.imm, 12, 10)
+                               | ENCODE (rn.num, 5, 5)
+                               | ENCODE (rd.num, 5, 0));
      }
    else
      {
@@ -1474,9 +1205,9 @@ emit_mov (uint32_t *buf, struct aarch64_register rd,
        /* Do not shift the immediate.  */
        uint32_t shift = ENCODE (0, 2, 21);
  
-      return emit_insn (buf, MOV | size | shift
-                       | ENCODE (operand.imm, 16, 5)
-                       | ENCODE (rd.num, 5, 0));
+      return aarch64_emit_insn (buf, MOV | size | shift
+                               | ENCODE (operand.imm, 16, 5)
+                               | ENCODE (rd.num, 5, 0));
      }
    else
      return emit_add (buf, rd, operand.reg, immediate_operand (0));
@@ -1496,8 +1227,8 @@ emit_movk (uint32_t *buf, struct aarch64_register rd, uint32_t imm,
  {
    uint32_t size = ENCODE (rd.is64, 1, 31);
  
-  return emit_insn (buf, MOVK | size | ENCODE (shift, 2, 21) |
-                   ENCODE (imm, 16, 5) | ENCODE (rd.num, 5, 0));
+  return aarch64_emit_insn (buf, MOVK | size | ENCODE (shift, 2, 21) |
+                           ENCODE (imm, 16, 5) | ENCODE (rd.num, 5, 0));
  }
  
  /* Write instructions into *BUF in order to move ADDR into a register.
@@ -1705,8 +1436,8 @@ static int
  emit_mrs (uint32_t *buf, struct aarch64_register rt,
           enum aarch64_system_control_registers system_reg)
  {
-  return emit_insn (buf, MRS | ENCODE (system_reg, 15, 5)
-                   | ENCODE (rt.num, 5, 0));
+  return aarch64_emit_insn (buf, MRS | ENCODE (system_reg, 15, 5)
+                           | ENCODE (rt.num, 5, 0));
  }
  
  /* Write a MSR instruction into *BUF.  The register size is 64-bit.
@@ -1720,8 +1451,8 @@ static int
  emit_msr (uint32_t *buf, enum aarch64_system_control_registers system_reg,
           struct aarch64_register rt)
  {
-  return emit_insn (buf, MSR | ENCODE (system_reg, 15, 5)
-                   | ENCODE (rt.num, 5, 0));
+  return aarch64_emit_insn (buf, MSR | ENCODE (system_reg, 15, 5)
+                           | ENCODE (rt.num, 5, 0));
  }
  
  /* Write a SEVL instruction into *BUF.
@@ -1731,7 +1462,7 @@ emit_msr (uint32_t *buf, enum aarch64_system_control_registers system_reg,
  static int
  emit_sevl (uint32_t *buf)
  {
-  return emit_insn (buf, SEVL);
+  return aarch64_emit_insn (buf, SEVL);
  }
  
  /* Write a WFE instruction into *BUF.
@@ -1741,7 +1472,7 @@ emit_sevl (uint32_t *buf)
  static int
  emit_wfe (uint32_t *buf)
  {
-  return emit_insn (buf, WFE);
+  return aarch64_emit_insn (buf, WFE);
  }
  
  /* Write a SBFM instruction into *BUF.
@@ -1763,9 +1494,9 @@ emit_sbfm (uint32_t *buf, struct aarch64_register rd,
    uint32_t size = ENCODE (rd.is64, 1, 31);
    uint32_t n = ENCODE (rd.is64, 1, 22);
  
-  return emit_insn (buf, SBFM | size | n | ENCODE (immr, 6, 16)
-                   | ENCODE (imms, 6, 10) | ENCODE (rn.num, 5, 5)
-                   | ENCODE (rd.num, 5, 0));
+  return aarch64_emit_insn (buf, SBFM | size | n | ENCODE (immr, 6, 16)
+                           | ENCODE (imms, 6, 10) | ENCODE (rn.num, 5, 5)
+                           | ENCODE (rd.num, 5, 0));
  }
  
  /* Write a SBFX instruction into *BUF.
@@ -1808,9 +1539,9 @@ emit_ubfm (uint32_t *buf, struct aarch64_register rd,
    uint32_t size = ENCODE (rd.is64, 1, 31);
    uint32_t n = ENCODE (rd.is64, 1, 22);
  
-  return emit_insn (buf, UBFM | size | n | ENCODE (immr, 6, 16)
-                   | ENCODE (imms, 6, 10) | ENCODE (rn.num, 5, 5)
-                   | ENCODE (rd.num, 5, 0));
+  return aarch64_emit_insn (buf, UBFM | size | n | ENCODE (immr, 6, 16)
+                           | ENCODE (imms, 6, 10) | ENCODE (rn.num, 5, 5)
+                           | ENCODE (rd.num, 5, 0));
  }
  
  /* Write a UBFX instruction into *BUF.
@@ -1852,9 +1583,9 @@ emit_csinc (uint32_t *buf, struct aarch64_register rd,
  {
    uint32_t size = ENCODE (rd.is64, 1, 31);
  
-  return emit_insn (buf, CSINC | size | ENCODE (rm.num, 5, 16)
-                   | ENCODE (cond, 4, 12) | ENCODE (rn.num, 5, 5)
-                   | ENCODE (rd.num, 5, 0));
+  return aarch64_emit_insn (buf, CSINC | size | ENCODE (rm.num, 5, 16)
+                           | ENCODE (cond, 4, 12) | ENCODE (rn.num, 5, 5)
+                           | ENCODE (rd.num, 5, 0));
  }
  
  /* Write a CSET instruction into *BUF.
@@ -1880,14 +1611,6 @@ emit_cset (uint32_t *buf, struct aarch64_register rd, unsigned cond)
    return emit_csinc (buf, rd, xzr, xzr, cond ^ 0x1);
  }
  
-/* Write a NOP instruction into *BUF.  */
-
-static int
-emit_nop (uint32_t *buf)
-{
-  return emit_insn (buf, NOP);
-}
-
  /* Write LEN instructions from BUF into the inferior memory at *TO.
  
     Note instructions are always little endian on AArch64, unlike data.  */
@@ -1897,204 +1620,250 @@ append_insns (CORE_ADDR *to, size_t len, const uint32_t *buf)
  {
    size_t byte_len = len * sizeof (uint32_t);
  #if (__BYTE_ORDER == __BIG_ENDIAN)
-  uint32_t *le_buf = xmalloc (byte_len);
+  uint32_t *le_buf = (uint32_t *) xmalloc (byte_len);
    size_t i;
  
    for (i = 0; i < len; i++)
      le_buf[i] = htole32 (buf[i]);
  
-  write_inferior_memory (*to, (const unsigned char *) le_buf, byte_len);
+  target_write_memory (*to, (const unsigned char *) le_buf, byte_len);
  
    xfree (le_buf);
  #else
-  write_inferior_memory (*to, (const unsigned char *) buf, byte_len);
+  target_write_memory (*to, (const unsigned char *) buf, byte_len);
  #endif
  
    *to += byte_len;
  }
  
-/* Helper function.  Return 1 if VAL can be encoded in BITS bits.  */
+/* Sub-class of struct aarch64_insn_data, store information of
+   instruction relocation for fast tracepoint.  Visitor can
+   relocate an instruction from BASE.INSN_ADDR to NEW_ADDR and save
+   the relocated instructions in buffer pointed by INSN_PTR.  */
  
-static int
-can_encode_int32 (int32_t val, unsigned bits)
+struct aarch64_insn_relocation_data
  {
-  /* This must be an arithemic shift.  */
-  int32_t rest = val >> bits;
+  struct aarch64_insn_data base;
  
-  return rest == 0 || rest == -1;
-}
+  /* The new address the instruction is relocated to.  */
+  CORE_ADDR new_addr;
+  /* Pointer to the buffer of relocated instruction(s).  */
+  uint32_t *insn_ptr;
+};
+
+/* Implementation of aarch64_insn_visitor method "b".  */
  
-/* Relocate an instruction INSN from OLDLOC to TO and save the relocated
-   instructions in BUF.  The number of instructions in BUF is returned.
+static void
+aarch64_ftrace_insn_reloc_b (const int is_bl, const int32_t offset,
+                            struct aarch64_insn_data *data)
+{
+  struct aarch64_insn_relocation_data *insn_reloc
+    = (struct aarch64_insn_relocation_data *) data;
+  int64_t new_offset
+    = insn_reloc->base.insn_addr - insn_reloc->new_addr + offset;
  
-   PC relative instructions need to be handled specifically:
+  if (can_encode_int32 (new_offset, 28))
+    insn_reloc->insn_ptr += emit_b (insn_reloc->insn_ptr, is_bl, new_offset);
+}
  
-   - B/BL
-   - B.COND
-   - CBZ/CBNZ
-   - TBZ/TBNZ
-   - ADR/ADRP
-   - LDR/LDRSW (literal)  */
+/* Implementation of aarch64_insn_visitor method "b_cond".  */
  
-static int
-aarch64_relocate_instruction (const CORE_ADDR to, const CORE_ADDR oldloc,
-                             uint32_t insn, uint32_t *buf)
+static void
+aarch64_ftrace_insn_reloc_b_cond (const unsigned cond, const int32_t offset,
+                                 struct aarch64_insn_data *data)
  {
-  uint32_t *p = buf;
+  struct aarch64_insn_relocation_data *insn_reloc
+    = (struct aarch64_insn_relocation_data *) data;
+  int64_t new_offset
+    = insn_reloc->base.insn_addr - insn_reloc->new_addr + offset;
  
-  int is_bl;
-  int is64;
-  int is_sw;
-  int is_cbnz;
-  int is_tbnz;
-  int is_adrp;
-  unsigned rn;
-  unsigned rt;
-  unsigned rd;
-  unsigned cond;
-  unsigned bit;
-  int32_t offset;
-
-  if (aarch64_decode_b (oldloc, insn, &is_bl, &offset))
+  if (can_encode_int32 (new_offset, 21))
      {
-      offset = (oldloc - to + offset);
-
-      if (can_encode_int32 (offset, 28))
-       p += emit_b (p, is_bl, offset);
-      else
-       return 0;
+      insn_reloc->insn_ptr += emit_bcond (insn_reloc->insn_ptr, cond,
+                                         new_offset);
      }
-  else if (aarch64_decode_bcond (oldloc, insn, &cond, &offset))
+  else if (can_encode_int32 (new_offset, 28))
      {
-      offset = (oldloc - to + offset);
-
-      if (can_encode_int32 (offset, 21))
-       p += emit_bcond (p, cond, offset);
-      else if (can_encode_int32 (offset, 28))
-       {
-         /* The offset is out of range for a conditional branch
-            instruction but not for a unconditional branch.  We can use
-            the following instructions instead:
+      /* The offset is out of range for a conditional branch
+        instruction but not for a unconditional branch.  We can use
+        the following instructions instead:
  
-              B.COND TAKEN    ; If cond is true, then jump to TAKEN.
-              B NOT_TAKEN     ; Else jump over TAKEN and continue.
-            TAKEN:
-              B #(offset - 8)
-            NOT_TAKEN:
+        B.COND TAKEN    ; If cond is true, then jump to TAKEN.
+        B NOT_TAKEN     ; Else jump over TAKEN and continue.
+        TAKEN:
+        B #(offset - 8)
+        NOT_TAKEN:
  
-            */
+      */
  
-         p += emit_bcond (p, cond, 8);
-         p += emit_b (p, 0, 8);
-         p += emit_b (p, 0, offset - 8);
-       }
-      else
-       return 0;
+      insn_reloc->insn_ptr += emit_bcond (insn_reloc->insn_ptr, cond, 8);
+      insn_reloc->insn_ptr += emit_b (insn_reloc->insn_ptr, 0, 8);
+      insn_reloc->insn_ptr += emit_b (insn_reloc->insn_ptr, 0, new_offset - 8);
      }
-  else if (aarch64_decode_cb (oldloc, insn, &is64, &is_cbnz, &rn, &offset))
-    {
-      offset = (oldloc - to + offset);
+}
  
-      if (can_encode_int32 (offset, 21))
-       p += emit_cb (p, is_cbnz, aarch64_register (rn, is64), offset);
-      else if (can_encode_int32 (offset, 28))
-       {
-         /* The offset is out of range for a compare and branch
-            instruction but not for a unconditional branch.  We can use
-            the following instructions instead:
-
-              CBZ xn, TAKEN   ; xn == 0, then jump to TAKEN.
-              B NOT_TAKEN     ; Else jump over TAKEN and continue.
-            TAKEN:
-              B #(offset - 8)
-            NOT_TAKEN:
-
-            */
-         p += emit_cb (p, is_cbnz, aarch64_register (rn, is64), 8);
-         p += emit_b (p, 0, 8);
-         p += emit_b (p, 0, offset - 8);
-       }
-      else
-       return 0;
+/* Implementation of aarch64_insn_visitor method "cb".  */
+
+static void
+aarch64_ftrace_insn_reloc_cb (const int32_t offset, const int is_cbnz,
+                             const unsigned rn, int is64,
+                             struct aarch64_insn_data *data)
+{
+  struct aarch64_insn_relocation_data *insn_reloc
+    = (struct aarch64_insn_relocation_data *) data;
+  int64_t new_offset
+    = insn_reloc->base.insn_addr - insn_reloc->new_addr + offset;
+
+  if (can_encode_int32 (new_offset, 21))
+    {
+      insn_reloc->insn_ptr += emit_cb (insn_reloc->insn_ptr, is_cbnz,
+                                      aarch64_register (rn, is64), new_offset);
      }
-  else if (aarch64_decode_tb (oldloc, insn, &is_tbnz, &bit, &rt, &offset))
+  else if (can_encode_int32 (new_offset, 28))
      {
-      offset = (oldloc - to + offset);
+      /* The offset is out of range for a compare and branch
+        instruction but not for a unconditional branch.  We can use
+        the following instructions instead:
+
+        CBZ xn, TAKEN   ; xn == 0, then jump to TAKEN.
+        B NOT_TAKEN     ; Else jump over TAKEN and continue.
+        TAKEN:
+        B #(offset - 8)
+        NOT_TAKEN:
+
+      */
+      insn_reloc->insn_ptr += emit_cb (insn_reloc->insn_ptr, is_cbnz,
+                                      aarch64_register (rn, is64), 8);
+      insn_reloc->insn_ptr += emit_b (insn_reloc->insn_ptr, 0, 8);
+      insn_reloc->insn_ptr += emit_b (insn_reloc->insn_ptr, 0, new_offset - 8);
+    }
+}
  
-      if (can_encode_int32 (offset, 16))
-       p += emit_tb (p, is_tbnz, bit, aarch64_register (rt, 1), offset);
-      else if (can_encode_int32 (offset, 28))
-       {
-         /* The offset is out of range for a test bit and branch
-            instruction but not for a unconditional branch.  We can use
-            the following instructions instead:
-
-              TBZ xn, #bit, TAKEN ; xn[bit] == 0, then jump to TAKEN.
-              B NOT_TAKEN         ; Else jump over TAKEN and continue.
-            TAKEN:
-              B #(offset - 8)
-            NOT_TAKEN:
-
-            */
-         p += emit_tb (p, is_tbnz, bit, aarch64_register (rt, 1), 8);
-         p += emit_b (p, 0, 8);
-         p += emit_b (p, 0, offset - 8);
-       }
-      else
-       return 0;
+/* Implementation of aarch64_insn_visitor method "tb".  */
+
+static void
+aarch64_ftrace_insn_reloc_tb (const int32_t offset, int is_tbnz,
+                             const unsigned rt, unsigned bit,
+                             struct aarch64_insn_data *data)
+{
+  struct aarch64_insn_relocation_data *insn_reloc
+    = (struct aarch64_insn_relocation_data *) data;
+  int64_t new_offset
+    = insn_reloc->base.insn_addr - insn_reloc->new_addr + offset;
+
+  if (can_encode_int32 (new_offset, 16))
+    {
+      insn_reloc->insn_ptr += emit_tb (insn_reloc->insn_ptr, is_tbnz, bit,
+                                      aarch64_register (rt, 1), new_offset);
      }
-  else if (aarch64_decode_adr (oldloc, insn, &is_adrp, &rd, &offset))
+  else if (can_encode_int32 (new_offset, 28))
      {
+      /* The offset is out of range for a test bit and branch
+        instruction but not for a unconditional branch.  We can use
+        the following instructions instead:
+
+        TBZ xn, #bit, TAKEN ; xn[bit] == 0, then jump to TAKEN.
+        B NOT_TAKEN         ; Else jump over TAKEN and continue.
+        TAKEN:
+        B #(offset - 8)
+        NOT_TAKEN:
+
+      */
+      insn_reloc->insn_ptr += emit_tb (insn_reloc->insn_ptr, is_tbnz, bit,
+                                      aarch64_register (rt, 1), 8);
+      insn_reloc->insn_ptr += emit_b (insn_reloc->insn_ptr, 0, 8);
+      insn_reloc->insn_ptr += emit_b (insn_reloc->insn_ptr, 0,
+                                     new_offset - 8);
+    }
+}
  
-      /* We know exactly the address the ADR{P,} instruction will compute.
-        We can just write it to the destination register.  */
-      CORE_ADDR address = oldloc + offset;
+/* Implementation of aarch64_insn_visitor method "adr".  */
  
-      if (is_adrp)
-       {
-         /* Clear the lower 12 bits of the offset to get the 4K page.  */
-         p += emit_mov_addr (p, aarch64_register (rd, 1),
-                             address & ~0xfff);
-       }
-      else
-       p += emit_mov_addr (p, aarch64_register (rd, 1), address);
-    }
-  else if (aarch64_decode_ldr_literal (oldloc, insn, &is_sw, &is64, &rt,
-                                      &offset))
+static void
+aarch64_ftrace_insn_reloc_adr (const int32_t offset, const unsigned rd,
+                              const int is_adrp,
+                              struct aarch64_insn_data *data)
+{
+  struct aarch64_insn_relocation_data *insn_reloc
+    = (struct aarch64_insn_relocation_data *) data;
+  /* We know exactly the address the ADR{P,} instruction will compute.
+     We can just write it to the destination register.  */
+  CORE_ADDR address = data->insn_addr + offset;
+
+  if (is_adrp)
      {
-      /* We know exactly what address to load from, and what register we
-        can use:
+      /* Clear the lower 12 bits of the offset to get the 4K page.  */
+      insn_reloc->insn_ptr += emit_mov_addr (insn_reloc->insn_ptr,
+                                            aarch64_register (rd, 1),
+                                            address & ~0xfff);
+    }
+  else
+    insn_reloc->insn_ptr += emit_mov_addr (insn_reloc->insn_ptr,
+                                          aarch64_register (rd, 1), address);
+}
  
-          MOV xd, #(oldloc + offset)
-          MOVK xd, #((oldloc + offset) >> 16), lsl #16
-          ...
+/* Implementation of aarch64_insn_visitor method "ldr_literal".  */
  
-          LDR xd, [xd] ; or LDRSW xd, [xd]
+static void
+aarch64_ftrace_insn_reloc_ldr_literal (const int32_t offset, const int is_sw,
+                                      const unsigned rt, const int is64,
+                                      struct aarch64_insn_data *data)
+{
+  struct aarch64_insn_relocation_data *insn_reloc
+    = (struct aarch64_insn_relocation_data *) data;
+  CORE_ADDR address = data->insn_addr + offset;
  
-        */
-      CORE_ADDR address = oldloc + offset;
+  insn_reloc->insn_ptr += emit_mov_addr (insn_reloc->insn_ptr,
+                                        aarch64_register (rt, 1), address);
  
-      p += emit_mov_addr (p, aarch64_register (rt, 1), address);
+  /* We know exactly what address to load from, and what register we
+     can use:
  
-      if (is_sw)
-       p += emit_ldrsw (p, aarch64_register (rt, 1),
-                        aarch64_register (rt, 1),
-                        offset_memory_operand (0));
-      else
-       p += emit_ldr (p, aarch64_register (rt, is64),
-                      aarch64_register (rt, 1),
-                      offset_memory_operand (0));
-    }
+     MOV xd, #(oldloc + offset)
+     MOVK xd, #((oldloc + offset) >> 16), lsl #16
+     ...
+
+     LDR xd, [xd] ; or LDRSW xd, [xd]
+
+  */
+
+  if (is_sw)
+    insn_reloc->insn_ptr += emit_ldrsw (insn_reloc->insn_ptr,
+                                       aarch64_register (rt, 1),
+                                       aarch64_register (rt, 1),
+                                       offset_memory_operand (0));
    else
-    {
-      /* The instruction is not PC relative.  Just re-emit it at the new
-        location.  */
-      p += emit_insn (p, insn);
-    }
+    insn_reloc->insn_ptr += emit_ldr (insn_reloc->insn_ptr,
+                                     aarch64_register (rt, is64),
+                                     aarch64_register (rt, 1),
+                                     offset_memory_operand (0));
+}
+
+/* Implementation of aarch64_insn_visitor method "others".  */
  
-  return (int) (p - buf);
+static void
+aarch64_ftrace_insn_reloc_others (const uint32_t insn,
+                                 struct aarch64_insn_data *data)
+{
+  struct aarch64_insn_relocation_data *insn_reloc
+    = (struct aarch64_insn_relocation_data *) data;
+
+  /* The instruction is not PC relative.  Just re-emit it at the new
+     location.  */
+  insn_reloc->insn_ptr += aarch64_emit_insn (insn_reloc->insn_ptr, insn);
  }
  
+static const struct aarch64_insn_visitor visitor =
+{
+  aarch64_ftrace_insn_reloc_b,
+  aarch64_ftrace_insn_reloc_b_cond,
+  aarch64_ftrace_insn_reloc_cb,
+  aarch64_ftrace_insn_reloc_tb,
+  aarch64_ftrace_insn_reloc_adr,
+  aarch64_ftrace_insn_reloc_ldr_literal,
+  aarch64_ftrace_insn_reloc_others,
+};
+
  /* Implementation of linux_target_ops method
     "install_fast_tracepoint_jump_pad".  */
  
@@ -2115,10 +1884,11 @@ aarch64_install_fast_tracepoint_jump_pad (CORE_ADDR tpoint,
  {
    uint32_t buf[256];
    uint32_t *p = buf;
-  int32_t offset;
+  int64_t offset;
    int i;
    uint32_t insn;
    CORE_ADDR buildaddr = *jump_entry;
+  struct aarch64_insn_relocation_data insn_data;
  
    /* We need to save the current state on the stack both to restore it
       later and to collect register values when the tracepoint is hit.
@@ -2421,9 +2191,16 @@ aarch64_install_fast_tracepoint_jump_pad (CORE_ADDR tpoint,
    /* Now emit the relocated instruction.  */
    *adjusted_insn_addr = buildaddr;
    target_read_uint32 (tpaddr, &insn);
-  i = aarch64_relocate_instruction (buildaddr, tpaddr, insn, buf);
+
+  insn_data.base.insn_addr = tpaddr;
+  insn_data.new_addr = buildaddr;
+  insn_data.insn_ptr = buf;
+
+  aarch64_relocate_instruction (insn, &visitor,
+                               (struct aarch64_insn_data *) &insn_data);
+
    /* We may not have been able to relocate the instruction.  */
-  if (i == 0)
+  if (insn_data.insn_ptr == buf)
      {
        sprintf (err,
                "E.Could not relocate instruction from %s to %s.",
@@ -2432,7 +2209,7 @@ aarch64_install_fast_tracepoint_jump_pad (CORE_ADDR tpoint,
        return 1;
      }
    else
-    append_insns (&buildaddr, i, buf);
+    append_insns (&buildaddr, insn_data.insn_ptr - buf, buf);
    *adjusted_insn_addr_end = buildaddr;
  
    /* Go back to the start of the buffer.  */
@@ -2444,7 +2221,7 @@ aarch64_install_fast_tracepoint_jump_pad (CORE_ADDR tpoint,
      {
        sprintf (err,
                "E.Jump back from jump pad too far from tracepoint "
-              "(offset 0x%" PRIx32 " cannot be encoded in 28 bits).",
+              "(offset 0x%" PRIx64 " cannot be encoded in 28 bits).",
                offset);
        return 1;
      }
@@ -2458,7 +2235,7 @@ aarch64_install_fast_tracepoint_jump_pad (CORE_ADDR tpoint,
      {
        sprintf (err,
                "E.Jump pad too far from tracepoint "
-              "(offset 0x%" PRIx32 " cannot be encoded in 28 bits).",
+              "(offset 0x%" PRIx64 " cannot be encoded in 28 bits).",
                offset);
        return 1;
      }
@@ -2583,7 +2360,7 @@ aarch64_emit_add (void)
    uint32_t *p = buf;
  
    p += emit_pop (p, x1);
-  p += emit_add (p, x0, x0, register_operand (x1));
+  p += emit_add (p, x0, x1, register_operand (x0));
  
    emit_ops_insns (buf, p - buf);
  }
@@ -2597,7 +2374,7 @@ aarch64_emit_sub (void)
    uint32_t *p = buf;
  
    p += emit_pop (p, x1);
-  p += emit_sub (p, x0, x0, register_operand (x1));
+  p += emit_sub (p, x0, x1, register_operand (x0));
  
    emit_ops_insns (buf, p - buf);
  }
@@ -3229,18 +3006,63 @@ aarch64_supports_range_stepping (void)
    return 1;
  }
  
+/* Implementation of linux_target_ops method "sw_breakpoint_from_kind".  */
+
+static const gdb_byte *
+aarch64_sw_breakpoint_from_kind (int kind, int *size)
+{
+  if (is_64bit_tdesc ())
+    {
+      *size = aarch64_breakpoint_len;
+      return aarch64_breakpoint;
+    }
+  else
+    return arm_sw_breakpoint_from_kind (kind, size);
+}
+
+/* Implementation of linux_target_ops method "breakpoint_kind_from_pc".  */
+
+static int
+aarch64_breakpoint_kind_from_pc (CORE_ADDR *pcptr)
+{
+  if (is_64bit_tdesc ())
+    return aarch64_breakpoint_len;
+  else
+    return arm_breakpoint_kind_from_pc (pcptr);
+}
+
+/* Implementation of the linux_target_ops method
+   "breakpoint_kind_from_current_state".  */
+
+static int
+aarch64_breakpoint_kind_from_current_state (CORE_ADDR *pcptr)
+{
+  if (is_64bit_tdesc ())
+    return aarch64_breakpoint_len;
+  else
+    return arm_breakpoint_kind_from_current_state (pcptr);
+}
+
+/* Support for hardware single step.  */
+
+static int
+aarch64_supports_hardware_single_step (void)
+{
+  return 1;
+}
+
  struct linux_target_ops the_low_target =
  {
    aarch64_arch_setup,
    aarch64_regs_info,
-  aarch64_cannot_fetch_register,
-  aarch64_cannot_store_register,
+  NULL, /* cannot_fetch_register */
+  NULL, /* cannot_store_register */
    NULL, /* fetch_register */
    aarch64_get_pc,
    aarch64_set_pc,
-  (const unsigned char *) &aarch64_breakpoint,
-  aarch64_breakpoint_len,
-  NULL, /* breakpoint_reinsert_addr */
+  aarch64_breakpoint_kind_from_pc,
+  aarch64_sw_breakpoint_from_kind,
+  NULL, /* get_next_pcs */
    0,    /* decr_pc_after_break */
    aarch64_breakpoint_at,
    aarch64_supports_z_point_type,
@@ -3252,7 +3074,9 @@ struct linux_target_ops the_low_target =
    NULL, /* supply_ptrace_register */
    aarch64_linux_siginfo_fixup,
    aarch64_linux_new_process,
+  aarch64_linux_delete_process,
    aarch64_linux_new_thread,
+  aarch64_linux_delete_thread,
    aarch64_linux_new_fork,
    aarch64_linux_prepare_to_resume,
    NULL, /* process_qsupported */
@@ -3262,14 +3086,16 @@ struct linux_target_ops the_low_target =
    aarch64_emit_ops,
    aarch64_get_min_fast_tracepoint_insn_len,
    aarch64_supports_range_stepping,
+  aarch64_breakpoint_kind_from_current_state,
+  aarch64_supports_hardware_single_step,
+  aarch64_get_syscall_trapinfo,
  };
  
  void
  initialize_low_arch (void)
  {
-  init_registers_aarch64 ();
-
    initialize_low_arch_aarch32 ();
  
    initialize_regsets_info (&aarch64_regsets_info);
+  initialize_regsets_info (&aarch64_sve_regsets_info);
  }