diff mbox

[AArch64] Add falkor pipeline description.

Message ID 1501710884-7378-1-git-send-email-jim.wilson@linaro.org
State New
Headers show

Commit Message

Jim Wilson Aug. 2, 2017, 9:54 p.m. UTC
This adds a pipeline description for the Qualcomm Falkor core.  This was
tested with a bootstrap and make check.  There were no regressions.  This
gives about 0.5% performance gain on SPEC CPU2006 on our internal tree, which
has a few other patches that aren't in the FSF tree yet.

OK?

Jim

	gcc/
	* config/aarch64/aarch64-cores.def (falkor): Use falkor pipeline.
	(qdf24xx): Likewise.
	* config/aarch64/aarch64.md: Include falkor.md.
	* config/aarch64/falkor.md: New.
---
 gcc/config/aarch64/aarch64-cores.def |   4 +-
 gcc/config/aarch64/aarch64.md        |   1 +
 gcc/config/aarch64/falkor.md         | 681 +++++++++++++++++++++++++++++++++++
 3 files changed, 684 insertions(+), 2 deletions(-)
 create mode 100644 gcc/config/aarch64/falkor.md

-- 
2.7.4

Comments

Richard Earnshaw (lists) Aug. 7, 2017, 1:20 p.m. UTC | #1
On 02/08/17 22:54, Jim Wilson wrote:
> This adds a pipeline description for the Qualcomm Falkor core.  This was

> tested with a bootstrap and make check.  There were no regressions.  This

> gives about 0.5% performance gain on SPEC CPU2006 on our internal tree, which

> has a few other patches that aren't in the FSF tree yet.

> 

> OK?

> 


OK.

R.

> Jim

> 

> 	gcc/

> 	* config/aarch64/aarch64-cores.def (falkor): Use falkor pipeline.

> 	(qdf24xx): Likewise.

> 	* config/aarch64/aarch64.md: Include falkor.md.

> 	* config/aarch64/falkor.md: New.

> ---

>  gcc/config/aarch64/aarch64-cores.def |   4 +-

>  gcc/config/aarch64/aarch64.md        |   1 +

>  gcc/config/aarch64/falkor.md         | 681 +++++++++++++++++++++++++++++++++++

>  3 files changed, 684 insertions(+), 2 deletions(-)

>  create mode 100644 gcc/config/aarch64/falkor.md

> 

> diff --git a/gcc/config/aarch64/aarch64-cores.def b/gcc/config/aarch64/aarch64-cores.def

> index b8d0ba6..1089332 100644

> --- a/gcc/config/aarch64/aarch64-cores.def

> +++ b/gcc/config/aarch64/aarch64-cores.def

> @@ -65,8 +65,8 @@ AARCH64_CORE("thunderxt83",   thunderxt83,   thunderx,  8A,  AARCH64_FL_FOR_ARCH

>  AARCH64_CORE("xgene1",      xgene1,    xgene1,    8A,  AARCH64_FL_FOR_ARCH8, xgene1, 0x50, 0x000, -1)

>  

>  /* Qualcomm ('Q') cores. */

> -AARCH64_CORE("falkor",      falkor,    cortexa57, 8A,  AARCH64_FL_FOR_ARCH8 | AARCH64_FL_CRC | AARCH64_FL_CRYPTO | AARCH64_FL_RDMA, qdf24xx,   0x51, 0xC00, -1)

> -AARCH64_CORE("qdf24xx",     qdf24xx,   cortexa57, 8A,  AARCH64_FL_FOR_ARCH8 | AARCH64_FL_CRC | AARCH64_FL_CRYPTO | AARCH64_FL_RDMA, qdf24xx,   0x51, 0xC00, -1)

> +AARCH64_CORE("falkor",      falkor,    falkor,    8A,  AARCH64_FL_FOR_ARCH8 | AARCH64_FL_CRC | AARCH64_FL_CRYPTO | AARCH64_FL_RDMA, qdf24xx,   0x51, 0xC00, -1)

> +AARCH64_CORE("qdf24xx",     qdf24xx,   falkor,    8A,  AARCH64_FL_FOR_ARCH8 | AARCH64_FL_CRC | AARCH64_FL_CRYPTO | AARCH64_FL_RDMA, qdf24xx,   0x51, 0xC00, -1)

>  

>  /* Samsung ('S') cores. */

>  AARCH64_CORE("exynos-m1",   exynosm1,  exynosm1,  8A,  AARCH64_FL_FOR_ARCH8 | AARCH64_FL_CRC | AARCH64_FL_CRYPTO, exynosm1,  0x53, 0x001, -1)

> diff --git a/gcc/config/aarch64/aarch64.md b/gcc/config/aarch64/aarch64.md

> index fc79947..51061b2 100644

> --- a/gcc/config/aarch64/aarch64.md

> +++ b/gcc/config/aarch64/aarch64.md

> @@ -231,6 +231,7 @@

>  (include "../arm/cortex-a53.md")

>  (include "../arm/cortex-a57.md")

>  (include "../arm/exynos-m1.md")

> +(include "falkor.md")

>  (include "thunderx.md")

>  (include "../arm/xgene1.md")

>  (include "thunderx2t99.md")

> diff --git a/gcc/config/aarch64/falkor.md b/gcc/config/aarch64/falkor.md

> new file mode 100644

> index 0000000..b422ab3

> --- /dev/null

> +++ b/gcc/config/aarch64/falkor.md

> @@ -0,0 +1,681 @@

> +;; Falkor pipeline description

> +;; Copyright (C) 2017 Free Software Foundation, Inc.

> +;;

> +;; This file is part of GCC.

> +;;

> +;; GCC is free software; you can redistribute it and/or modify it

> +;; under the terms of the GNU General Public License as published by

> +;; the Free Software Foundation; either version 3, or (at your option)

> +;; any later version.

> +;;

> +;; GCC is distributed in the hope that it will be useful, but

> +;; WITHOUT ANY WARRANTY; without even the implied warranty of

> +;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

> +;; General Public License for more details.

> +;;

> +;; You should have received a copy of the GNU General Public License

> +;; along with GCC; see the file COPYING3.  If not see

> +;; <http://www.gnu.org/licenses/>.

> +

> +(define_automaton "falkor")

> +

> +;; Complex int instructions (e.g. multiply and divide) execute in the X

> +;; pipeline.  Simple int instructions execute in the X, Y, and Z pipelines.

> +

> +(define_cpu_unit "falkor_x" "falkor")

> +(define_cpu_unit "falkor_y" "falkor")

> +(define_cpu_unit "falkor_z" "falkor")

> +

> +;; Branches execute in the B pipeline or in one of the int pipelines depending

> +;; on how complex it is.  Simple int insns (like movz) can also execute here.

> +

> +(define_cpu_unit "falkor_b" "falkor")

> +

> +;; Vector and FP insns execute in the VX and VY pipelines.

> +

> +(define_automaton "falkor_vfp")

> +

> +(define_cpu_unit "falkor_vx" "falkor_vfp")

> +(define_cpu_unit "falkor_vy" "falkor_vfp")

> +

> +;; Loads execute in the LD pipeline.

> +;; Stores execute in the ST, SD, and VSD pipelines, for address, data, and

> +;; vector data.

> +

> +(define_automaton "falkor_mem")

> +

> +(define_cpu_unit "falkor_ld" "falkor_mem")

> +(define_cpu_unit "falkor_st" "falkor_mem")

> +(define_cpu_unit "falkor_sd" "falkor_mem")

> +(define_cpu_unit "falkor_vsd" "falkor_mem")

> +

> +;; The GTOV and VTOG pipelines are for general to vector reg moves, and vice

> +;; versa.

> +

> +(define_cpu_unit "falkor_gtov" "falkor")

> +(define_cpu_unit "falkor_vtog" "falkor")

> +

> +;; Common reservation combinations.

> +

> +(define_reservation "falkor_vxvy" "falkor_vx|falkor_vy")

> +(define_reservation "falkor_zb"   "falkor_z|falkor_b")

> +(define_reservation "falkor_xyz"  "falkor_x|falkor_y|falkor_z")

> +(define_reservation "falkor_xyzb" "falkor_x|falkor_y|falkor_z|falkor_b")

> +

> +;; SIMD Floating-Point Instructions

> +

> +(define_insn_reservation "falkor_afp_1_vxvy" 1

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_neg_s,neon_fp_neg_d,neon_fp_abs_s,neon_fp_abs_d"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_1_vxvy_vxvy" 1

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_neg_s_q,neon_fp_neg_d_q,neon_fp_abs_s_q,neon_fp_abs_d_q"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_2_vxvy" 2

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_minmax_s,neon_fp_minmax_d,neon_fp_reduc_minmax_s,neon_fp_reduc_minmax_d,neon_fp_compare_s,neon_fp_compare_d,neon_fp_round_s,neon_fp_round_d"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_2_vxvy_vxvy" 2

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_minmax_s_q,neon_fp_minmax_d_q,neon_fp_compare_s_q,neon_fp_compare_d_q,neon_fp_round_s_q,neon_fp_round_d_q"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_3_vxvy" 3

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_reduc_minmax_s_q,neon_fp_reduc_minmax_d_q,neon_fp_abd_s,neon_fp_abd_d,neon_fp_addsub_s,neon_fp_addsub_d,neon_fp_reduc_add_s,neon_fp_reduc_add_d"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_3_vxvy_vxvy" 3

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_abd_s_q,neon_fp_abd_d_q,neon_fp_addsub_s_q,neon_fp_addsub_d_q,neon_fp_reduc_add_s_q,neon_fp_reduc_add_d_q"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_4_vxvy" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_to_int_s,neon_fp_to_int_d,neon_int_to_fp_s,neon_int_to_fp_d,neon_fp_cvt_widen_h,neon_fp_cvt_widen_s"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_4_vxvy_vxvy" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_to_int_s_q,neon_fp_to_int_d_q,neon_int_to_fp_s_q,neon_int_to_fp_d_q"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_5_vxvy_mul" 5

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_mul_s,neon_fp_mul_s_scalar"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_5_vxvy_mla" 5

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_mla_s,neon_fp_mla_s_scalar"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_5_vxvy_vxvy_mul" 5

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_mul_s_q,neon_fp_mul_s_scalar_q"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_5_vxvy_vxvy_mla" 5

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_mla_s_q,neon_fp_mla_s_scalar_q"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_6_vxvy_mul" 6

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_mul_d"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_6_vxvy_mla" 6

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_mla_d"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_6_vxvy_vxvy_mul" 6

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_mul_d_q,neon_fp_mul_d_scalar_q"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_6_vxvy_vxvy_mla" 6

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_mla_d_q,neon_fp_mla_d_scalar_q"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_4_vxvy_vxvy_vxvy" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_cvt_narrow_s_q,neon_fp_cvt_narrow_d_q"))

> +  "falkor_vxvy+falkor_vxvy,falkor_vxvy")

> +

> +(define_insn_reservation "falkor_afp_6_vx_vy" 6

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_div_s"))

> +  "falkor_vx+falkor_vy")

> +

> +(define_insn_reservation "falkor_afp_11_vx_vy" 11

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_div_d"))

> +  "falkor_vx+falkor_vy")

> +

> +(define_insn_reservation "falkor_afp_6_vx_vy_vx_vy" 6

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_div_s_q"))

> +  "(falkor_vx+falkor_vy),(falkor_vx+falkor_vy)")

> +

> +(define_insn_reservation "falkor_afp_11_vx_vy_vx_vy" 11

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_div_d_q"))

> +  "(falkor_vx+falkor_vy),(falkor_vx+falkor_vy)")

> +

> +(define_insn_reservation "falkor_afp_12_vx_vy" 12

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_sqrt_s"))

> +  "falkor_vx+falkor_vy")

> +

> +(define_insn_reservation "falkor_afp_22_vx_vy" 22

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_sqrt_d"))

> +  "falkor_vx+falkor_vy")

> +

> +(define_insn_reservation "falkor_afp_12_vx_vy_vx_vy" 12

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_sqrt_s_q"))

> +  "(falkor_vx+falkor_vy),(falkor_vx+falkor_vy)")

> +

> +(define_insn_reservation "falkor_afp_22_vx_vy_vx_vy" 22

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_sqrt_d_q"))

> +  "(falkor_vx+falkor_vy),(falkor_vx+falkor_vy)")

> +

> +;; SIMD Integer Instructions

> +

> +(define_insn_reservation "falkor_ai_1_vxvy" 1

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_add,neon_reduc_add,neon_logic,neon_neg,neon_sub"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_ai_1_vxvy_vxvy" 1

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_shift_imm_long,neon_add_q,neon_reduc_add_q,neon_logic_q,neon_neg_q,neon_sub_q"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_ai_2_vxvy" 2

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_add_long,neon_sub_long,neon_add_halve,neon_sub_halve,neon_shift_imm,neon_shift_reg,neon_minmax,neon_abs,neon_compare,neon_compare_zero,neon_tst"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_ai_2_vxvy_vxvy" 2

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_add_halve_q,neon_sub_halve_q,neon_shift_imm_q,neon_shift_reg_q,neon_minmax_q,neon_abs_q,neon_compare_q,neon_compare_zero_q,neon_tst_q,neon_reduc_add_long"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_ai_3_vxvy" 3

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_shift_acc,neon_reduc_add_acc,neon_abd,neon_qadd,neon_qsub,neon_qabs,neon_qneg,neon_sat_shift_imm,neon_sat_shift_imm_narrow_q,neon_sat_shift_reg,neon_reduc_minmax"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_ai_4_vxvy" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_reduc_minmax_q"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_ai_3_vxvy_vxvy" 3

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_shift_acc_q,neon_reduc_add_acc_q,neon_abd_q,neon_abd_long,neon_qadd_q,neon_qsub_q,neon_qabs_q,neon_qneg_q,neon_sat_shift_imm_q,neon_sat_shift_reg_q"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_ai_4_vxvy_mul" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_mul_b,neon_mul_h,neon_mul_s,neon_mul_h_scalar,neon_mul_s_scalar,neon_sat_mul_b,neon_sat_mul_h,neon_sat_mul_s,neon_sat_mul_h_scalar,neon_sat_mul_s_scalar"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_ai_4_vxvy_mla" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_mla_b,neon_mla_h,neon_mla_s,neon_mla_h_scalar,neon_mla_s_scalar"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_ai_4_vxvy_vxvy_mul" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_mul_b_q,neon_mul_h_q,neon_mul_s_q,neon_mul_h_scalar_q,neon_mul_s_scalar_q,neon_sat_mul_b_q,neon_sat_mul_h_q,neon_sat_mul_s_q,neon_mul_b_long,neon_mul_h_long,neon_mul_s_long,neon_mul_d_long,neon_mul_h_scalar_long,neon_mul_s_scalar_long,neon_sat_mul_b_long,neon_sat_mul_h_long,neon_sat_mul_s_long,neon_sat_mul_h_scalar_q,neon_sat_mul_s_scalar_q,neon_sat_mul_h_scalar_long,neon_sat_mul_s_scalar_long"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_ai_4_vxvy_vxvy_mla" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_mla_b_q,neon_mla_h_q,neon_mla_s_q,neon_mla_h_scalar_q,neon_mla_s_scalar_q,neon_mla_b_long,neon_mla_h_long,neon_mla_s_long,neon_mla_h_scalar_long,neon_mla_s_scalar_long,neon_sat_mla_b_long,neon_sat_mla_h_long,neon_sat_mla_s_long,neon_sat_mla_h_scalar_long,neon_sat_mla_s_scalar_long"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_ai_4_vxvy_vxvy" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_add_halve_narrow_q,neon_sub_halve_narrow_q,neon_arith_acc"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_2_ai_vxvy_vxvy_vxvy_vxvy" 2

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_add_widen,neon_sub_widen"))

> +  "(falkor_vxvy+falkor_vxvy),(falkor_vxvy+falkor_vxvy)")

> +

> +(define_insn_reservation "falkor_4_ai_vxvy_vxvy_vxvy_vxvy" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_arith_acc_q"))

> +  "(falkor_vxvy+falkor_vxvy),(falkor_vxvy+falkor_vxvy)")

> +

> +;; SIMD Load Instructions

> +

> +(define_insn_reservation "falkor_ald_4_ld" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_load1_1reg,neon_load1_1reg_q,neon_load1_all_lanes,neon_load2_one_lane"))

> +  "falkor_ld")

> +

> +(define_insn_reservation "falkor_ald_4_ld_none" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_load1_2reg,neon_load2_2reg,neon_load2_all_lanes"))

> +  "falkor_ld")

> +

> +(define_insn_reservation "falkor_ald_4_ld_ld" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_load1_2reg_q,neon_load2_2reg_q,neon_load2_all_lanes_q,neon_load3_one_lane,neon_load4_one_lane,neon_ldp,neon_ldp_q"))

> +  "falkor_ld,falkor_ld")

> +

> +(define_insn_reservation "falkor_ald_4_ld_ld_none" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_load1_3reg,neon_load3_3reg,neon_load3_all_lanes"))

> +  "falkor_ld,falkor_ld")

> +

> +(define_insn_reservation "falkor_ald_4_ld_ld_ld" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_load1_3reg_q,neon_load3_3reg_q,neon_load3_all_lanes_q"))

> +  "falkor_ld,falkor_ld,falkor_ld")

> +

> +(define_insn_reservation "falkor_ald_4_ld_ld_none_none" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_load1_4reg,neon_load4_4reg"))

> +  "falkor_ld,falkor_ld")

> +

> +(define_insn_reservation "falkor_ald_4_ld_ld_ld_ld" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_load1_4reg_q,neon_load4_4reg_q,neon_load4_all_lanes,neon_load4_all_lanes_q"))

> +  "falkor_ld,falkor_ld,falkor_ld,falkor_ld")

> +

> +;; Arithmetic and Logical Instructions

> +

> +(define_insn_reservation "falkor_alu_1_xyz" 1

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "alus_sreg,alus_imm,alus_shift_imm,csel,adc_reg,alu_imm,alu_sreg,alu_shift_imm,alu_ext,alus_ext,logic_imm,logic_reg,logic_shift_imm,logics_imm,logics_reg,logics_shift_imm,mov_reg"))

> +  "falkor_xyz")

> +

> +;; SIMD Miscellaneous Instructions

> +

> +;; No separate type for ins and dup.  But this is correct for both.

> +

> +(define_insn_reservation "falkor_am_3_gtov" 3

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_from_gp"))

> +  "falkor_gtov")

> +

> +;; No separate type for ins and dup.  Assuming dup is more common.  Ins is

> +;; gtov+vxvy and latency of 4.

> +

> +(define_insn_reservation "falkor_am_3_gtov_gtov" 3

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_from_gp_q"))

> +  "falkor_gtov,falkor_gtov")

> +

> +;; neon_to_gp_q is used for 32-bit ARM instructions that move 64-bits of data

> +;; so no use needed here.

> +

> +(define_insn_reservation "falkor_am_3_vtog" 3

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_to_gp"))

> +  "falkor_vtog")

> +

> +(define_insn_reservation "falkor_am_1_vxvy" 1

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_bsl,neon_dup,neon_ext,neon_ins,neon_ins_q,neon_move,neon_rev,neon_tbl1,neon_permute,neon_shift_imm_narrow_q"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_am_1_vxvy_vxvy" 1

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_bsl_q,neon_dup_q,neon_ext_q,neon_move_q,neon_rev_q,neon_tbl1_q,neon_permute_q"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_am_2_vxvy" 2

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_cls,neon_cnt,neon_rbit"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_am_4_vxvy_vxvy" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_cls_q,neon_cnt_q,neon_rbit_q,neon_tbl2"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_am_3_vxvy" 3

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_recpe_s,neon_fp_recpe_d,neon_fp_rsqrte_s,neon_fp_rsqrte_d,neon_fp_recpx_s,neon_fp_recpx_d"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_am_3_vxvy_vxvy" 3

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_recpe_s_q,neon_fp_recpe_d_q,neon_fp_rsqrte_s_q,neon_fp_rsqrte_d_q"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_am_5_vxvy" 5

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_recps_s"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_am_5_vxvy_vxvy" 5

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_recps_s_q"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_am_6_vxvy" 6

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_recps_d,neon_fp_rsqrts_d"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_am_6_vxvy_vxvy" 6

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_fp_recps_d_q,neon_fp_rsqrts_d_q"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_am_5_vxvy_vxvy_vxvy" 5

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_tbl2_q,neon_tbl3"))

> +  "(falkor_vxvy+falkor_vxvy),falkor_vxvy")

> +

> +(define_insn_reservation "falkor_am_6_vxvy_vxvy_vxvy_vxvy" 6

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_tbl3_q,neon_tbl4"))

> +  "(falkor_vxvy+falkor_vxvy),(falkor_vxvy+falkor_vxvy)")

> +

> +(define_insn_reservation "falkor_am_7_vxvy_vxvy_vxvy_vxvy_vxvy" 7

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_tbl4_q"))

> +  "(falkor_vxvy+falkor_vxvy),(falkor_vxvy+falkor_vxvy),falkor_vxvy")

> +

> +;; SIMD Store Instructions

> +

> +;; ??? stp is neon_store1_2reg in aarch64.md, but neon_stp in aarch64-simd.md.

> +;; Similarly with ldp.

> +

> +(define_insn_reservation "falkor_ast_st_vsd" 0

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_store1_1reg,neon_store1_1reg_q,neon_store1_one_lane,neon_store1_one_lane_q,neon_store1_2reg,neon_store2_2reg,neon_store2_one_lane,neon_store2_one_lane_q,neon_stp"))

> +  "falkor_st+falkor_vsd")

> +

> +(define_insn_reservation "falkor_as_0_st_vsd_st_vsd" 0

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_store1_2reg_q,neon_store1_3reg,neon_store1_4reg,neon_store2_2reg_q,neon_store3_3reg,neon_store4_4reg,neon_store3_one_lane,neon_store3_one_lane_q,neon_store4_one_lane,neon_store4_one_lane_q,neon_stp_q"))

> +  "(falkor_st+falkor_vsd),(falkor_st+falkor_vsd)")

> +

> +(define_insn_reservation "falkor_as_0_st_vsd_st_vsd_st_vsd" 0

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_store1_3reg_q,neon_store3_3reg_q"))

> +  "(falkor_st+falkor_vsd),(falkor_st+falkor_vsd),(falkor_st+falkor_vsd)")

> +

> +(define_insn_reservation "falkor_as_0_st_vsd_st_vsd_st_vsd_st_vsd" 0

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "neon_store1_4reg_q,neon_store4_4reg_q"))

> +  "(falkor_st+falkor_vsd),(falkor_st+falkor_vsd),(falkor_st+falkor_vsd),(falkor_st+falkor_vsd)")

> +

> +;; Branch Instructions

> +

> +(define_insn_reservation "falkor_branch_0_zb" 0

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "branch"))

> +  "falkor_zb")

> +

> +(define_insn_reservation "falkor_call_0_xyzb" 0

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "call"))

> +  "falkor_xyzb")

> +

> +;; Cryptography Extensions

> +

> +(define_insn_reservation "falkor_cry_1_vxvy" 1

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "crypto_sha1_fast"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_cry_2_vxvy" 2

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "crypto_aesmc"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_cry_2_vxvy_vxvy" 2

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "crypto_sha1_xor,crypto_sha256_fast,crypto_pmull"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +(define_insn_reservation "falkor_cry_4_vy_vx" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "crypto_sha1_slow"))

> +  "falkor_vy+falkor_vx")

> +

> +(define_insn_reservation "falkor_cry_6_vy_vx" 6

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "crypto_sha256_slow"))

> +  "falkor_vy+falkor_vx")

> +

> +(define_insn_reservation "falkor_cry_3_vxvy_vxvy" 3

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "crypto_aese"))

> +  "falkor_vxvy+falkor_vxvy")

> +

> +;; FP Load Instructions

> +

> +(define_insn_reservation "falkor_fld_4_ld" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "f_loads,f_loadd"))

> +  "falkor_ld")

> +

> +;; No separate FP store section, these are found in the SIMD store section.

> +

> +(define_insn_reservation "falkor_fld_0_st_vsd" 0

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "f_stores,f_stored"))

> +  "falkor_st+falkor_vsd")

> +

> +;; FP Data Processing Instructions

> +

> +(define_insn_reservation "falkor_fpdt_0_vxvy" 0

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "fcmps,fcmpd,fccmps,fccmpd"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_fpdt_5_vtog" 5

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "f_cvtf2i"))

> +  "falkor_vtog")

> +

> +(define_insn_reservation "falkor_fpdt_1_vxvy" 1

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "ffariths,ffarithd,fcsel"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_fpdt_2_vxvy" 2

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "f_minmaxd,f_minmaxs,f_rintd,f_rints"))

> +  "falkor_vxvy")

> +

> +;; Scalar FP ABD is handled same as vector FP ABD.

> +

> +(define_insn_reservation "falkor_fpdt_3_vxvy" 3

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "faddd,fadds"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_fpdt_4_vxvy" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "f_cvt"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_fpdt_5_vxvy_mul" 5

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "fmuls"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_fpdt_5_vxvy_mla" 5

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "fmacs,ffmas"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_fpdt_6_vxvy_mul" 6

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "fmuld"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_fpdt_6_vxvy_mla" 6

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "fmacd,ffmad"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_fpdt_6_vx_vy" 6

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "fdivs"))

> +  "falkor_vx+falkor_vy")

> +

> +(define_insn_reservation "falkor_fpdt_11_vx_vy" 11

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "fdivd"))

> +  "falkor_vx+falkor_vy")

> +

> +(define_insn_reservation "falkor_fpdt_12_vx_vy" 12

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "fsqrts"))

> +  "falkor_vxvy")

> +

> +(define_insn_reservation "falkor_fpdt_22_vx_vy" 22

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "fsqrtd"))

> +  "falkor_vxvy")

> +

> +;; FP Miscellaneous Instructions

> +

> +(define_insn_reservation "falkor_fpmsc_3_vtog" 3

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "f_mrc"))

> +  "falkor_vtog")

> +

> +(define_insn_reservation "falkor_fpmsc_3_gtov" 3

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "f_mcr"))

> +  "falkor_gtov")

> +

> +(define_insn_reservation "falkor_fpmsc_1_vxvy" 1

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "fmov,fconsts,fconstd"))

> +  "falkor_vxvy")

> +

> +;; No separate type for float-to-fixed conversions.  Same type as

> +;; float-to-int conversions.  They schedule the same though, so no problem.

> +

> +(define_insn_reservation "falkor_fpmsc_6_gtov" 6

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "f_cvti2f"))

> +  "falkor_gtov")

> +

> +;; Load Instructions

> +

> +(define_insn_reservation "falkor_ld_3_ld" 3

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "load1,load2"))

> +  "falkor_ld")

> +

> +;; Miscellaneous Data-Processing Instructions

> +

> +(define_insn_reservation "falkor_misc_1_xyz" 1

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "bfx,bfm,extend,rotate_imm,shift_imm"))

> +  "falkor_xyz")

> +

> +(define_insn_reservation "falkor_misc_2_x" 2

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "crc"))

> +  "falkor_x")

> +

> +(define_insn_reservation "falkor_misc_2_xyz" 2

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "clz,rbit,rev"))

> +  "falkor_xyz")

> +

> +;; Divide and Multiply Instructions

> +

> +(define_insn_reservation "falkor_muldiv_4_x_mul" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "mul"))

> +  "falkor_x")

> +

> +(define_insn_reservation "falkor_muldiv_4_x_mla" 4

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "mla,smlal,umlal"))

> +  "falkor_x")

> +

> +(define_insn_reservation "falkor_muldiv_5_x_mul" 5

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "smull,umull"))

> +  "falkor_x")

> +

> +(define_insn_reservation "falkor_md_11_x_z" 11

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "sdiv,udiv"))

> +  "falkor_x+falkor_z")

> +

> +;; Move and Shift Instructions

> +

> +(define_insn_reservation "falkor_mvs_1_xyz" 1

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "mov_imm,shift_reg"))

> +  "falkor_xyz")

> +

> +(define_insn_reservation "falkor_mvs_1_xyzb" 1

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "adr"))

> +  "falkor_xyzb")

> +

> +;; Other Instructions

> +

> +;; Block is for instruction scheduling blockage insns in RTL.  There are no

> +;; hardware instructions emitted for them, so don't use any resources.

> +

> +(define_insn_reservation "falkor_other_0_nothing" 0

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "no_insn,trap,block"))

> +  "nothing")

> +

> +(define_insn_reservation "falkor_other_2_z" 2

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "mrs"))

> +  "falkor_z")

> +

> +;; Assume multiple instructions use all pipes.

> +

> +(define_insn_reservation "falkor_extra" 1

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "multiple"))

> +  "falkor_x+falkor_y+falkor_z+falkor_b+falkor_vx+falkor_vy+falkor_ld+falkor_st+falkor_sd+falkor_vsd+falkor_gtov+falkor_vtog")

> +

> +;; Store Instructions

> +

> +;; No use of store_rel, store3, or store4 in aarch64.

> +

> +(define_insn_reservation "falkor_st_0_st_sd" 0

> +  (and (eq_attr "tune" "falkor")

> +       (eq_attr "type" "store1,store2"))

> +  "falkor_st+falkor_sd")

> +

> +;; Muliply bypasses.

> +

> +;; 1 cycle latency (0 bubble) for an integer mul or mac feeding into a mac.

> +

> +(define_bypass 1

> +  "falkor_ai_4_vxvy_mul,falkor_ai_4_vxvy_mla,falkor_ai_4_vxvy_vxvy_mul,falkor_ai_4_vxvy_vxvy_mla,falkor_muldiv_4_x_mul,falkor_muldiv_4_x_mla,falkor_muldiv_5_x_mul"

> +  "falkor_ai_4_vxvy_mla,falkor_ai_4_vxvy_vxvy_mla,falkor_muldiv_4_x_mla")

> +

> +;; 3 cycle latency (2 bubbles) for an FP mul or mac feeding into a mac.

> +

> +(define_bypass 3

> +  "falkor_afp_5_vxvy_mul,falkor_afp_5_vxvy_mla,falkor_afp_5_vxvy_vxvy_mul,falkor_afp_5_vxvy_vxvy_mla,falkor_afp_6_vxvy_mul,falkor_afp_6_vxvy_mla,falkor_afp_6_vxvy_vxvy_mul,falkor_afp_6_vxvy_vxvy_mla,falkor_fpdt_5_vxvy_mul,falkor_fpdt_5_vxvy_mla,falkor_fpdt_6_vxvy_mul,falkor_fpdt_6_vxvy_mla"

> +  "falkor_afp_5_vxvy_mla,falkor_afp_5_vxvy_vxvy_mla,falkor_afp_6_vxvy_mla,falkor_afp_6_vxvy_vxvy_mla,falkor_fpdt_5_vxvy_mla,falkor_fpdt_6_vxvy_mla")

>
diff mbox

Patch

diff --git a/gcc/config/aarch64/aarch64-cores.def b/gcc/config/aarch64/aarch64-cores.def
index b8d0ba6..1089332 100644
--- a/gcc/config/aarch64/aarch64-cores.def
+++ b/gcc/config/aarch64/aarch64-cores.def
@@ -65,8 +65,8 @@  AARCH64_CORE("thunderxt83",   thunderxt83,   thunderx,  8A,  AARCH64_FL_FOR_ARCH
 AARCH64_CORE("xgene1",      xgene1,    xgene1,    8A,  AARCH64_FL_FOR_ARCH8, xgene1, 0x50, 0x000, -1)
 
 /* Qualcomm ('Q') cores. */
-AARCH64_CORE("falkor",      falkor,    cortexa57, 8A,  AARCH64_FL_FOR_ARCH8 | AARCH64_FL_CRC | AARCH64_FL_CRYPTO | AARCH64_FL_RDMA, qdf24xx,   0x51, 0xC00, -1)
-AARCH64_CORE("qdf24xx",     qdf24xx,   cortexa57, 8A,  AARCH64_FL_FOR_ARCH8 | AARCH64_FL_CRC | AARCH64_FL_CRYPTO | AARCH64_FL_RDMA, qdf24xx,   0x51, 0xC00, -1)
+AARCH64_CORE("falkor",      falkor,    falkor,    8A,  AARCH64_FL_FOR_ARCH8 | AARCH64_FL_CRC | AARCH64_FL_CRYPTO | AARCH64_FL_RDMA, qdf24xx,   0x51, 0xC00, -1)
+AARCH64_CORE("qdf24xx",     qdf24xx,   falkor,    8A,  AARCH64_FL_FOR_ARCH8 | AARCH64_FL_CRC | AARCH64_FL_CRYPTO | AARCH64_FL_RDMA, qdf24xx,   0x51, 0xC00, -1)
 
 /* Samsung ('S') cores. */
 AARCH64_CORE("exynos-m1",   exynosm1,  exynosm1,  8A,  AARCH64_FL_FOR_ARCH8 | AARCH64_FL_CRC | AARCH64_FL_CRYPTO, exynosm1,  0x53, 0x001, -1)
diff --git a/gcc/config/aarch64/aarch64.md b/gcc/config/aarch64/aarch64.md
index fc79947..51061b2 100644
--- a/gcc/config/aarch64/aarch64.md
+++ b/gcc/config/aarch64/aarch64.md
@@ -231,6 +231,7 @@ 
 (include "../arm/cortex-a53.md")
 (include "../arm/cortex-a57.md")
 (include "../arm/exynos-m1.md")
+(include "falkor.md")
 (include "thunderx.md")
 (include "../arm/xgene1.md")
 (include "thunderx2t99.md")
diff --git a/gcc/config/aarch64/falkor.md b/gcc/config/aarch64/falkor.md
new file mode 100644
index 0000000..b422ab3
--- /dev/null
+++ b/gcc/config/aarch64/falkor.md
@@ -0,0 +1,681 @@ 
+;; Falkor pipeline description
+;; Copyright (C) 2017 Free Software Foundation, Inc.
+;;
+;; This file is part of GCC.
+;;
+;; GCC is free software; you can redistribute it and/or modify it
+;; under the terms of the GNU General Public License as published by
+;; the Free Software Foundation; either version 3, or (at your option)
+;; any later version.
+;;
+;; GCC is distributed in the hope that it will be useful, but
+;; WITHOUT ANY WARRANTY; without even the implied warranty of
+;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+;; General Public License for more details.
+;;
+;; You should have received a copy of the GNU General Public License
+;; along with GCC; see the file COPYING3.  If not see
+;; <http://www.gnu.org/licenses/>.
+
+(define_automaton "falkor")
+
+;; Complex int instructions (e.g. multiply and divide) execute in the X
+;; pipeline.  Simple int instructions execute in the X, Y, and Z pipelines.
+
+(define_cpu_unit "falkor_x" "falkor")
+(define_cpu_unit "falkor_y" "falkor")
+(define_cpu_unit "falkor_z" "falkor")
+
+;; Branches execute in the B pipeline or in one of the int pipelines depending
+;; on how complex it is.  Simple int insns (like movz) can also execute here.
+
+(define_cpu_unit "falkor_b" "falkor")
+
+;; Vector and FP insns execute in the VX and VY pipelines.
+
+(define_automaton "falkor_vfp")
+
+(define_cpu_unit "falkor_vx" "falkor_vfp")
+(define_cpu_unit "falkor_vy" "falkor_vfp")
+
+;; Loads execute in the LD pipeline.
+;; Stores execute in the ST, SD, and VSD pipelines, for address, data, and
+;; vector data.
+
+(define_automaton "falkor_mem")
+
+(define_cpu_unit "falkor_ld" "falkor_mem")
+(define_cpu_unit "falkor_st" "falkor_mem")
+(define_cpu_unit "falkor_sd" "falkor_mem")
+(define_cpu_unit "falkor_vsd" "falkor_mem")
+
+;; The GTOV and VTOG pipelines are for general to vector reg moves, and vice
+;; versa.
+
+(define_cpu_unit "falkor_gtov" "falkor")
+(define_cpu_unit "falkor_vtog" "falkor")
+
+;; Common reservation combinations.
+
+(define_reservation "falkor_vxvy" "falkor_vx|falkor_vy")
+(define_reservation "falkor_zb"   "falkor_z|falkor_b")
+(define_reservation "falkor_xyz"  "falkor_x|falkor_y|falkor_z")
+(define_reservation "falkor_xyzb" "falkor_x|falkor_y|falkor_z|falkor_b")
+
+;; SIMD Floating-Point Instructions
+
+(define_insn_reservation "falkor_afp_1_vxvy" 1
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_neg_s,neon_fp_neg_d,neon_fp_abs_s,neon_fp_abs_d"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_1_vxvy_vxvy" 1
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_neg_s_q,neon_fp_neg_d_q,neon_fp_abs_s_q,neon_fp_abs_d_q"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_2_vxvy" 2
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_minmax_s,neon_fp_minmax_d,neon_fp_reduc_minmax_s,neon_fp_reduc_minmax_d,neon_fp_compare_s,neon_fp_compare_d,neon_fp_round_s,neon_fp_round_d"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_2_vxvy_vxvy" 2
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_minmax_s_q,neon_fp_minmax_d_q,neon_fp_compare_s_q,neon_fp_compare_d_q,neon_fp_round_s_q,neon_fp_round_d_q"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_3_vxvy" 3
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_reduc_minmax_s_q,neon_fp_reduc_minmax_d_q,neon_fp_abd_s,neon_fp_abd_d,neon_fp_addsub_s,neon_fp_addsub_d,neon_fp_reduc_add_s,neon_fp_reduc_add_d"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_3_vxvy_vxvy" 3
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_abd_s_q,neon_fp_abd_d_q,neon_fp_addsub_s_q,neon_fp_addsub_d_q,neon_fp_reduc_add_s_q,neon_fp_reduc_add_d_q"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_4_vxvy" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_to_int_s,neon_fp_to_int_d,neon_int_to_fp_s,neon_int_to_fp_d,neon_fp_cvt_widen_h,neon_fp_cvt_widen_s"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_4_vxvy_vxvy" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_to_int_s_q,neon_fp_to_int_d_q,neon_int_to_fp_s_q,neon_int_to_fp_d_q"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_5_vxvy_mul" 5
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_mul_s,neon_fp_mul_s_scalar"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_5_vxvy_mla" 5
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_mla_s,neon_fp_mla_s_scalar"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_5_vxvy_vxvy_mul" 5
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_mul_s_q,neon_fp_mul_s_scalar_q"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_5_vxvy_vxvy_mla" 5
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_mla_s_q,neon_fp_mla_s_scalar_q"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_6_vxvy_mul" 6
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_mul_d"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_6_vxvy_mla" 6
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_mla_d"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_6_vxvy_vxvy_mul" 6
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_mul_d_q,neon_fp_mul_d_scalar_q"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_6_vxvy_vxvy_mla" 6
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_mla_d_q,neon_fp_mla_d_scalar_q"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_4_vxvy_vxvy_vxvy" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_cvt_narrow_s_q,neon_fp_cvt_narrow_d_q"))
+  "falkor_vxvy+falkor_vxvy,falkor_vxvy")
+
+(define_insn_reservation "falkor_afp_6_vx_vy" 6
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_div_s"))
+  "falkor_vx+falkor_vy")
+
+(define_insn_reservation "falkor_afp_11_vx_vy" 11
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_div_d"))
+  "falkor_vx+falkor_vy")
+
+(define_insn_reservation "falkor_afp_6_vx_vy_vx_vy" 6
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_div_s_q"))
+  "(falkor_vx+falkor_vy),(falkor_vx+falkor_vy)")
+
+(define_insn_reservation "falkor_afp_11_vx_vy_vx_vy" 11
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_div_d_q"))
+  "(falkor_vx+falkor_vy),(falkor_vx+falkor_vy)")
+
+(define_insn_reservation "falkor_afp_12_vx_vy" 12
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_sqrt_s"))
+  "falkor_vx+falkor_vy")
+
+(define_insn_reservation "falkor_afp_22_vx_vy" 22
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_sqrt_d"))
+  "falkor_vx+falkor_vy")
+
+(define_insn_reservation "falkor_afp_12_vx_vy_vx_vy" 12
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_sqrt_s_q"))
+  "(falkor_vx+falkor_vy),(falkor_vx+falkor_vy)")
+
+(define_insn_reservation "falkor_afp_22_vx_vy_vx_vy" 22
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_sqrt_d_q"))
+  "(falkor_vx+falkor_vy),(falkor_vx+falkor_vy)")
+
+;; SIMD Integer Instructions
+
+(define_insn_reservation "falkor_ai_1_vxvy" 1
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_add,neon_reduc_add,neon_logic,neon_neg,neon_sub"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_ai_1_vxvy_vxvy" 1
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_shift_imm_long,neon_add_q,neon_reduc_add_q,neon_logic_q,neon_neg_q,neon_sub_q"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_ai_2_vxvy" 2
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_add_long,neon_sub_long,neon_add_halve,neon_sub_halve,neon_shift_imm,neon_shift_reg,neon_minmax,neon_abs,neon_compare,neon_compare_zero,neon_tst"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_ai_2_vxvy_vxvy" 2
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_add_halve_q,neon_sub_halve_q,neon_shift_imm_q,neon_shift_reg_q,neon_minmax_q,neon_abs_q,neon_compare_q,neon_compare_zero_q,neon_tst_q,neon_reduc_add_long"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_ai_3_vxvy" 3
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_shift_acc,neon_reduc_add_acc,neon_abd,neon_qadd,neon_qsub,neon_qabs,neon_qneg,neon_sat_shift_imm,neon_sat_shift_imm_narrow_q,neon_sat_shift_reg,neon_reduc_minmax"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_ai_4_vxvy" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_reduc_minmax_q"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_ai_3_vxvy_vxvy" 3
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_shift_acc_q,neon_reduc_add_acc_q,neon_abd_q,neon_abd_long,neon_qadd_q,neon_qsub_q,neon_qabs_q,neon_qneg_q,neon_sat_shift_imm_q,neon_sat_shift_reg_q"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_ai_4_vxvy_mul" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_mul_b,neon_mul_h,neon_mul_s,neon_mul_h_scalar,neon_mul_s_scalar,neon_sat_mul_b,neon_sat_mul_h,neon_sat_mul_s,neon_sat_mul_h_scalar,neon_sat_mul_s_scalar"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_ai_4_vxvy_mla" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_mla_b,neon_mla_h,neon_mla_s,neon_mla_h_scalar,neon_mla_s_scalar"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_ai_4_vxvy_vxvy_mul" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_mul_b_q,neon_mul_h_q,neon_mul_s_q,neon_mul_h_scalar_q,neon_mul_s_scalar_q,neon_sat_mul_b_q,neon_sat_mul_h_q,neon_sat_mul_s_q,neon_mul_b_long,neon_mul_h_long,neon_mul_s_long,neon_mul_d_long,neon_mul_h_scalar_long,neon_mul_s_scalar_long,neon_sat_mul_b_long,neon_sat_mul_h_long,neon_sat_mul_s_long,neon_sat_mul_h_scalar_q,neon_sat_mul_s_scalar_q,neon_sat_mul_h_scalar_long,neon_sat_mul_s_scalar_long"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_ai_4_vxvy_vxvy_mla" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_mla_b_q,neon_mla_h_q,neon_mla_s_q,neon_mla_h_scalar_q,neon_mla_s_scalar_q,neon_mla_b_long,neon_mla_h_long,neon_mla_s_long,neon_mla_h_scalar_long,neon_mla_s_scalar_long,neon_sat_mla_b_long,neon_sat_mla_h_long,neon_sat_mla_s_long,neon_sat_mla_h_scalar_long,neon_sat_mla_s_scalar_long"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_ai_4_vxvy_vxvy" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_add_halve_narrow_q,neon_sub_halve_narrow_q,neon_arith_acc"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_2_ai_vxvy_vxvy_vxvy_vxvy" 2
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_add_widen,neon_sub_widen"))
+  "(falkor_vxvy+falkor_vxvy),(falkor_vxvy+falkor_vxvy)")
+
+(define_insn_reservation "falkor_4_ai_vxvy_vxvy_vxvy_vxvy" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_arith_acc_q"))
+  "(falkor_vxvy+falkor_vxvy),(falkor_vxvy+falkor_vxvy)")
+
+;; SIMD Load Instructions
+
+(define_insn_reservation "falkor_ald_4_ld" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_load1_1reg,neon_load1_1reg_q,neon_load1_all_lanes,neon_load2_one_lane"))
+  "falkor_ld")
+
+(define_insn_reservation "falkor_ald_4_ld_none" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_load1_2reg,neon_load2_2reg,neon_load2_all_lanes"))
+  "falkor_ld")
+
+(define_insn_reservation "falkor_ald_4_ld_ld" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_load1_2reg_q,neon_load2_2reg_q,neon_load2_all_lanes_q,neon_load3_one_lane,neon_load4_one_lane,neon_ldp,neon_ldp_q"))
+  "falkor_ld,falkor_ld")
+
+(define_insn_reservation "falkor_ald_4_ld_ld_none" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_load1_3reg,neon_load3_3reg,neon_load3_all_lanes"))
+  "falkor_ld,falkor_ld")
+
+(define_insn_reservation "falkor_ald_4_ld_ld_ld" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_load1_3reg_q,neon_load3_3reg_q,neon_load3_all_lanes_q"))
+  "falkor_ld,falkor_ld,falkor_ld")
+
+(define_insn_reservation "falkor_ald_4_ld_ld_none_none" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_load1_4reg,neon_load4_4reg"))
+  "falkor_ld,falkor_ld")
+
+(define_insn_reservation "falkor_ald_4_ld_ld_ld_ld" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_load1_4reg_q,neon_load4_4reg_q,neon_load4_all_lanes,neon_load4_all_lanes_q"))
+  "falkor_ld,falkor_ld,falkor_ld,falkor_ld")
+
+;; Arithmetic and Logical Instructions
+
+(define_insn_reservation "falkor_alu_1_xyz" 1
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "alus_sreg,alus_imm,alus_shift_imm,csel,adc_reg,alu_imm,alu_sreg,alu_shift_imm,alu_ext,alus_ext,logic_imm,logic_reg,logic_shift_imm,logics_imm,logics_reg,logics_shift_imm,mov_reg"))
+  "falkor_xyz")
+
+;; SIMD Miscellaneous Instructions
+
+;; No separate type for ins and dup.  But this is correct for both.
+
+(define_insn_reservation "falkor_am_3_gtov" 3
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_from_gp"))
+  "falkor_gtov")
+
+;; No separate type for ins and dup.  Assuming dup is more common.  Ins is
+;; gtov+vxvy and latency of 4.
+
+(define_insn_reservation "falkor_am_3_gtov_gtov" 3
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_from_gp_q"))
+  "falkor_gtov,falkor_gtov")
+
+;; neon_to_gp_q is used for 32-bit ARM instructions that move 64-bits of data
+;; so no use needed here.
+
+(define_insn_reservation "falkor_am_3_vtog" 3
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_to_gp"))
+  "falkor_vtog")
+
+(define_insn_reservation "falkor_am_1_vxvy" 1
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_bsl,neon_dup,neon_ext,neon_ins,neon_ins_q,neon_move,neon_rev,neon_tbl1,neon_permute,neon_shift_imm_narrow_q"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_am_1_vxvy_vxvy" 1
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_bsl_q,neon_dup_q,neon_ext_q,neon_move_q,neon_rev_q,neon_tbl1_q,neon_permute_q"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_am_2_vxvy" 2
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_cls,neon_cnt,neon_rbit"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_am_4_vxvy_vxvy" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_cls_q,neon_cnt_q,neon_rbit_q,neon_tbl2"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_am_3_vxvy" 3
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_recpe_s,neon_fp_recpe_d,neon_fp_rsqrte_s,neon_fp_rsqrte_d,neon_fp_recpx_s,neon_fp_recpx_d"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_am_3_vxvy_vxvy" 3
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_recpe_s_q,neon_fp_recpe_d_q,neon_fp_rsqrte_s_q,neon_fp_rsqrte_d_q"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_am_5_vxvy" 5
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_recps_s"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_am_5_vxvy_vxvy" 5
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_recps_s_q"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_am_6_vxvy" 6
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_recps_d,neon_fp_rsqrts_d"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_am_6_vxvy_vxvy" 6
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_fp_recps_d_q,neon_fp_rsqrts_d_q"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_am_5_vxvy_vxvy_vxvy" 5
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_tbl2_q,neon_tbl3"))
+  "(falkor_vxvy+falkor_vxvy),falkor_vxvy")
+
+(define_insn_reservation "falkor_am_6_vxvy_vxvy_vxvy_vxvy" 6
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_tbl3_q,neon_tbl4"))
+  "(falkor_vxvy+falkor_vxvy),(falkor_vxvy+falkor_vxvy)")
+
+(define_insn_reservation "falkor_am_7_vxvy_vxvy_vxvy_vxvy_vxvy" 7
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_tbl4_q"))
+  "(falkor_vxvy+falkor_vxvy),(falkor_vxvy+falkor_vxvy),falkor_vxvy")
+
+;; SIMD Store Instructions
+
+;; ??? stp is neon_store1_2reg in aarch64.md, but neon_stp in aarch64-simd.md.
+;; Similarly with ldp.
+
+(define_insn_reservation "falkor_ast_st_vsd" 0
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_store1_1reg,neon_store1_1reg_q,neon_store1_one_lane,neon_store1_one_lane_q,neon_store1_2reg,neon_store2_2reg,neon_store2_one_lane,neon_store2_one_lane_q,neon_stp"))
+  "falkor_st+falkor_vsd")
+
+(define_insn_reservation "falkor_as_0_st_vsd_st_vsd" 0
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_store1_2reg_q,neon_store1_3reg,neon_store1_4reg,neon_store2_2reg_q,neon_store3_3reg,neon_store4_4reg,neon_store3_one_lane,neon_store3_one_lane_q,neon_store4_one_lane,neon_store4_one_lane_q,neon_stp_q"))
+  "(falkor_st+falkor_vsd),(falkor_st+falkor_vsd)")
+
+(define_insn_reservation "falkor_as_0_st_vsd_st_vsd_st_vsd" 0
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_store1_3reg_q,neon_store3_3reg_q"))
+  "(falkor_st+falkor_vsd),(falkor_st+falkor_vsd),(falkor_st+falkor_vsd)")
+
+(define_insn_reservation "falkor_as_0_st_vsd_st_vsd_st_vsd_st_vsd" 0
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "neon_store1_4reg_q,neon_store4_4reg_q"))
+  "(falkor_st+falkor_vsd),(falkor_st+falkor_vsd),(falkor_st+falkor_vsd),(falkor_st+falkor_vsd)")
+
+;; Branch Instructions
+
+(define_insn_reservation "falkor_branch_0_zb" 0
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "branch"))
+  "falkor_zb")
+
+(define_insn_reservation "falkor_call_0_xyzb" 0
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "call"))
+  "falkor_xyzb")
+
+;; Cryptography Extensions
+
+(define_insn_reservation "falkor_cry_1_vxvy" 1
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "crypto_sha1_fast"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_cry_2_vxvy" 2
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "crypto_aesmc"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_cry_2_vxvy_vxvy" 2
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "crypto_sha1_xor,crypto_sha256_fast,crypto_pmull"))
+  "falkor_vxvy+falkor_vxvy")
+
+(define_insn_reservation "falkor_cry_4_vy_vx" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "crypto_sha1_slow"))
+  "falkor_vy+falkor_vx")
+
+(define_insn_reservation "falkor_cry_6_vy_vx" 6
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "crypto_sha256_slow"))
+  "falkor_vy+falkor_vx")
+
+(define_insn_reservation "falkor_cry_3_vxvy_vxvy" 3
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "crypto_aese"))
+  "falkor_vxvy+falkor_vxvy")
+
+;; FP Load Instructions
+
+(define_insn_reservation "falkor_fld_4_ld" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "f_loads,f_loadd"))
+  "falkor_ld")
+
+;; No separate FP store section, these are found in the SIMD store section.
+
+(define_insn_reservation "falkor_fld_0_st_vsd" 0
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "f_stores,f_stored"))
+  "falkor_st+falkor_vsd")
+
+;; FP Data Processing Instructions
+
+(define_insn_reservation "falkor_fpdt_0_vxvy" 0
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "fcmps,fcmpd,fccmps,fccmpd"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_fpdt_5_vtog" 5
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "f_cvtf2i"))
+  "falkor_vtog")
+
+(define_insn_reservation "falkor_fpdt_1_vxvy" 1
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "ffariths,ffarithd,fcsel"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_fpdt_2_vxvy" 2
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "f_minmaxd,f_minmaxs,f_rintd,f_rints"))
+  "falkor_vxvy")
+
+;; Scalar FP ABD is handled same as vector FP ABD.
+
+(define_insn_reservation "falkor_fpdt_3_vxvy" 3
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "faddd,fadds"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_fpdt_4_vxvy" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "f_cvt"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_fpdt_5_vxvy_mul" 5
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "fmuls"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_fpdt_5_vxvy_mla" 5
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "fmacs,ffmas"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_fpdt_6_vxvy_mul" 6
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "fmuld"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_fpdt_6_vxvy_mla" 6
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "fmacd,ffmad"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_fpdt_6_vx_vy" 6
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "fdivs"))
+  "falkor_vx+falkor_vy")
+
+(define_insn_reservation "falkor_fpdt_11_vx_vy" 11
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "fdivd"))
+  "falkor_vx+falkor_vy")
+
+(define_insn_reservation "falkor_fpdt_12_vx_vy" 12
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "fsqrts"))
+  "falkor_vxvy")
+
+(define_insn_reservation "falkor_fpdt_22_vx_vy" 22
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "fsqrtd"))
+  "falkor_vxvy")
+
+;; FP Miscellaneous Instructions
+
+(define_insn_reservation "falkor_fpmsc_3_vtog" 3
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "f_mrc"))
+  "falkor_vtog")
+
+(define_insn_reservation "falkor_fpmsc_3_gtov" 3
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "f_mcr"))
+  "falkor_gtov")
+
+(define_insn_reservation "falkor_fpmsc_1_vxvy" 1
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "fmov,fconsts,fconstd"))
+  "falkor_vxvy")
+
+;; No separate type for float-to-fixed conversions.  Same type as
+;; float-to-int conversions.  They schedule the same though, so no problem.
+
+(define_insn_reservation "falkor_fpmsc_6_gtov" 6
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "f_cvti2f"))
+  "falkor_gtov")
+
+;; Load Instructions
+
+(define_insn_reservation "falkor_ld_3_ld" 3
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "load1,load2"))
+  "falkor_ld")
+
+;; Miscellaneous Data-Processing Instructions
+
+(define_insn_reservation "falkor_misc_1_xyz" 1
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "bfx,bfm,extend,rotate_imm,shift_imm"))
+  "falkor_xyz")
+
+(define_insn_reservation "falkor_misc_2_x" 2
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "crc"))
+  "falkor_x")
+
+(define_insn_reservation "falkor_misc_2_xyz" 2
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "clz,rbit,rev"))
+  "falkor_xyz")
+
+;; Divide and Multiply Instructions
+
+(define_insn_reservation "falkor_muldiv_4_x_mul" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "mul"))
+  "falkor_x")
+
+(define_insn_reservation "falkor_muldiv_4_x_mla" 4
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "mla,smlal,umlal"))
+  "falkor_x")
+
+(define_insn_reservation "falkor_muldiv_5_x_mul" 5
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "smull,umull"))
+  "falkor_x")
+
+(define_insn_reservation "falkor_md_11_x_z" 11
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "sdiv,udiv"))
+  "falkor_x+falkor_z")
+
+;; Move and Shift Instructions
+
+(define_insn_reservation "falkor_mvs_1_xyz" 1
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "mov_imm,shift_reg"))
+  "falkor_xyz")
+
+(define_insn_reservation "falkor_mvs_1_xyzb" 1
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "adr"))
+  "falkor_xyzb")
+
+;; Other Instructions
+
+;; Block is for instruction scheduling blockage insns in RTL.  There are no
+;; hardware instructions emitted for them, so don't use any resources.
+
+(define_insn_reservation "falkor_other_0_nothing" 0
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "no_insn,trap,block"))
+  "nothing")
+
+(define_insn_reservation "falkor_other_2_z" 2
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "mrs"))
+  "falkor_z")
+
+;; Assume multiple instructions use all pipes.
+
+(define_insn_reservation "falkor_extra" 1
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "multiple"))
+  "falkor_x+falkor_y+falkor_z+falkor_b+falkor_vx+falkor_vy+falkor_ld+falkor_st+falkor_sd+falkor_vsd+falkor_gtov+falkor_vtog")
+
+;; Store Instructions
+
+;; No use of store_rel, store3, or store4 in aarch64.
+
+(define_insn_reservation "falkor_st_0_st_sd" 0
+  (and (eq_attr "tune" "falkor")
+       (eq_attr "type" "store1,store2"))
+  "falkor_st+falkor_sd")
+
+;; Muliply bypasses.
+
+;; 1 cycle latency (0 bubble) for an integer mul or mac feeding into a mac.
+
+(define_bypass 1
+  "falkor_ai_4_vxvy_mul,falkor_ai_4_vxvy_mla,falkor_ai_4_vxvy_vxvy_mul,falkor_ai_4_vxvy_vxvy_mla,falkor_muldiv_4_x_mul,falkor_muldiv_4_x_mla,falkor_muldiv_5_x_mul"
+  "falkor_ai_4_vxvy_mla,falkor_ai_4_vxvy_vxvy_mla,falkor_muldiv_4_x_mla")
+
+;; 3 cycle latency (2 bubbles) for an FP mul or mac feeding into a mac.
+
+(define_bypass 3
+  "falkor_afp_5_vxvy_mul,falkor_afp_5_vxvy_mla,falkor_afp_5_vxvy_vxvy_mul,falkor_afp_5_vxvy_vxvy_mla,falkor_afp_6_vxvy_mul,falkor_afp_6_vxvy_mla,falkor_afp_6_vxvy_vxvy_mul,falkor_afp_6_vxvy_vxvy_mla,falkor_fpdt_5_vxvy_mul,falkor_fpdt_5_vxvy_mla,falkor_fpdt_6_vxvy_mul,falkor_fpdt_6_vxvy_mla"
+  "falkor_afp_5_vxvy_mla,falkor_afp_5_vxvy_vxvy_mla,falkor_afp_6_vxvy_mla,falkor_afp_6_vxvy_vxvy_mla,falkor_fpdt_5_vxvy_mla,falkor_fpdt_6_vxvy_mla")