target/loongarch: Add estimated reciprocal instructions

author Jiajie Chen <c@jia.je>

Wed, 19 Nov 2025 12:30:55 +0000 (20:30 +0800)

committer Song Gao <gaosong@loongson.cn>

Tue, 10 Feb 2026 02:48:20 +0000 (10:48 +0800)
author Jiajie Chen <c@jia.je>
Wed, 19 Nov 2025 12:30:55 +0000 (20:30 +0800)
committer Song Gao <gaosong@loongson.cn>
Tue, 10 Feb 2026 02:48:20 +0000 (10:48 +0800)
diff --git a/target/loongarch/cpu.h b/target/loongarch/cpu.h

index a518541c54549e7b40f0b0b86da2bb55ff79c6ec..8648d0514a269d6d971b97638d76fd752d5c5dda 100644 (file)
--- a/target/loongarch/cpu.h
+++ b/target/loongarch/cpu.h
@@ -138,6 +138,7 @@ FIELD(CPUCFG2, LBT_ALL, 18, 3)
  FIELD(CPUCFG2, LSPW, 21, 1)
  FIELD(CPUCFG2, LAM, 22, 1)
  FIELD(CPUCFG2, HPTW, 24, 1)
+FIELD(CPUCFG2, FRECIPE, 25, 1)
  FIELD(CPUCFG2, LAM_BH, 27, 1)
  FIELD(CPUCFG2, LAMCAS, 28, 1)
  
diff --git a/target/loongarch/disas.c b/target/loongarch/disas.c

index 66c0cae5a9dc22eb8882fed16ace63824a234952..e5e1b37ce026f8deded156f775047d8b827524d7 100644 (file)
--- a/target/loongarch/disas.c
+++ b/target/loongarch/disas.c
@@ -478,6 +478,10 @@ INSN(frecip_s,     ff)
  INSN(frecip_d,     ff)
  INSN(frsqrt_s,     ff)
  INSN(frsqrt_d,     ff)
+INSN(frecipe_s,    ff)
+INSN(frecipe_d,    ff)
+INSN(frsqrte_s,    ff)
+INSN(frsqrte_d,    ff)
  INSN(fmov_s,       ff)
  INSN(fmov_d,       ff)
  INSN(movgr2fr_w,   fr)
@@ -1429,6 +1433,10 @@ INSN_LSX(vfrecip_s,        vv)
  INSN_LSX(vfrecip_d,        vv)
  INSN_LSX(vfrsqrt_s,        vv)
  INSN_LSX(vfrsqrt_d,        vv)
+INSN_LSX(vfrecipe_s,       vv)
+INSN_LSX(vfrecipe_d,       vv)
+INSN_LSX(vfrsqrte_s,       vv)
+INSN_LSX(vfrsqrte_d,       vv)
  
  INSN_LSX(vfcvtl_s_h,       vv)
  INSN_LSX(vfcvth_s_h,       vv)
@@ -2343,6 +2351,10 @@ INSN_LASX(xvfrecip_s,        vv)
  INSN_LASX(xvfrecip_d,        vv)
  INSN_LASX(xvfrsqrt_s,        vv)
  INSN_LASX(xvfrsqrt_d,        vv)
+INSN_LASX(xvfrecipe_s,       vv)
+INSN_LASX(xvfrecipe_d,       vv)
+INSN_LASX(xvfrsqrte_s,       vv)
+INSN_LASX(xvfrsqrte_d,       vv)
  
  INSN_LASX(xvfcvtl_s_h,       vv)
  INSN_LASX(xvfcvth_s_h,       vv)
diff --git a/target/loongarch/insns.decode b/target/loongarch/insns.decode

index cf4123cd463f59fe3bc91edc1933cdb0bd0554a6..92078f0f9fa9fde2aa680007989955f66a76c158 100644 (file)
--- a/target/loongarch/insns.decode
+++ b/target/loongarch/insns.decode
@@ -371,6 +371,10 @@ frecip_s        0000 00010001 01000 10101 ..... .....    @ff
  frecip_d        0000 00010001 01000 10110 ..... .....    @ff
  frsqrt_s        0000 00010001 01000 11001 ..... .....    @ff
  frsqrt_d        0000 00010001 01000 11010 ..... .....    @ff
+frecipe_s       0000 00010001 01000 11101 ..... .....    @ff
+frecipe_d       0000 00010001 01000 11110 ..... .....    @ff
+frsqrte_s       0000 00010001 01001 00001 ..... .....    @ff
+frsqrte_d       0000 00010001 01001 00010 ..... .....    @ff
  fscaleb_s       0000 00010001 00001 ..... ..... .....    @fff
  fscaleb_d       0000 00010001 00010 ..... ..... .....    @fff
  flogb_s         0000 00010001 01000 01001 ..... .....    @ff
@@ -1115,6 +1119,10 @@ vfrecip_s        0111 00101001 11001 11101 ..... .....    @vv
  vfrecip_d        0111 00101001 11001 11110 ..... .....    @vv
  vfrsqrt_s        0111 00101001 11010 00001 ..... .....    @vv
  vfrsqrt_d        0111 00101001 11010 00010 ..... .....    @vv
+vfrecipe_s       0111 00101001 11010 00101 ..... .....    @vv
+vfrecipe_d       0111 00101001 11010 00110 ..... .....    @vv
+vfrsqrte_s       0111 00101001 11010 01001 ..... .....    @vv
+vfrsqrte_d       0111 00101001 11010 01010 ..... .....    @vv
  
  vfcvtl_s_h       0111 00101001 11011 11010 ..... .....    @vv
  vfcvth_s_h       0111 00101001 11011 11011 ..... .....    @vv
@@ -1879,6 +1887,10 @@ xvfrecip_s       0111 01101001 11001 11101 ..... .....    @vv
  xvfrecip_d       0111 01101001 11001 11110 ..... .....    @vv
  xvfrsqrt_s       0111 01101001 11010 00001 ..... .....    @vv
  xvfrsqrt_d       0111 01101001 11010 00010 ..... .....    @vv
+xvfrecipe_s      0111 01101001 11010 00101 ..... .....    @vv
+xvfrecipe_d      0111 01101001 11010 00110 ..... .....    @vv
+xvfrsqrte_s      0111 01101001 11010 01001 ..... .....    @vv
+xvfrsqrte_d      0111 01101001 11010 01010 ..... .....    @vv
  
  xvfcvtl_s_h      0111 01101001 11011 11010 ..... .....    @vv
  xvfcvth_s_h      0111 01101001 11011 11011 ..... .....    @vv
diff --git a/target/loongarch/tcg/insn_trans/trans_farith.c.inc b/target/loongarch/tcg/insn_trans/trans_farith.c.inc

index ff6cf3448e725972072005dafbf976d2adea6e98..eed6ab7312505674ffe8132029b82e2eecda30d7 100644 (file)
--- a/target/loongarch/tcg/insn_trans/trans_farith.c.inc
+++ b/target/loongarch/tcg/insn_trans/trans_farith.c.inc
@@ -191,6 +191,10 @@ TRANS(frecip_s, FP_SP, gen_ff, gen_helper_frecip_s)
  TRANS(frecip_d, FP_DP, gen_ff, gen_helper_frecip_d)
  TRANS(frsqrt_s, FP_SP, gen_ff, gen_helper_frsqrt_s)
  TRANS(frsqrt_d, FP_DP, gen_ff, gen_helper_frsqrt_d)
+TRANS(frecipe_s, FRECIPE_FP_SP, gen_ff, gen_helper_frecip_s)
+TRANS(frecipe_d, FRECIPE_FP_DP, gen_ff, gen_helper_frecip_d)
+TRANS(frsqrte_s, FRECIPE_FP_SP, gen_ff, gen_helper_frsqrt_s)
+TRANS(frsqrte_d, FRECIPE_FP_DP, gen_ff, gen_helper_frsqrt_d)
  TRANS64(flogb_s, FP_SP, gen_ff, gen_helper_flogb_s)
  TRANS64(flogb_d, FP_DP, gen_ff, gen_helper_flogb_d)
  TRANS(fclass_s, FP_SP, gen_ff, gen_helper_fclass_s)
diff --git a/target/loongarch/tcg/insn_trans/trans_vec.c.inc b/target/loongarch/tcg/insn_trans/trans_vec.c.inc

index ea7e705bab4e3916b4d4c92b503ae3a835503acb..195b89f78834b208f0ba83930b844e792dc488b6 100644 (file)
--- a/target/loongarch/tcg/insn_trans/trans_vec.c.inc
+++ b/target/loongarch/tcg/insn_trans/trans_vec.c.inc
@@ -4407,12 +4407,20 @@ TRANS(vfrecip_s, LSX, gen_vv_ptr, gen_helper_vfrecip_s)
  TRANS(vfrecip_d, LSX, gen_vv_ptr, gen_helper_vfrecip_d)
  TRANS(vfrsqrt_s, LSX, gen_vv_ptr, gen_helper_vfrsqrt_s)
  TRANS(vfrsqrt_d, LSX, gen_vv_ptr, gen_helper_vfrsqrt_d)
+TRANS(vfrecipe_s, FRECIPE_LSX, gen_vv_ptr, gen_helper_vfrecip_s)
+TRANS(vfrecipe_d, FRECIPE_LSX, gen_vv_ptr, gen_helper_vfrecip_d)
+TRANS(vfrsqrte_s, FRECIPE_LSX, gen_vv_ptr, gen_helper_vfrsqrt_s)
+TRANS(vfrsqrte_d, FRECIPE_LSX, gen_vv_ptr, gen_helper_vfrsqrt_d)
  TRANS(xvfsqrt_s, LASX, gen_xx_ptr, gen_helper_vfsqrt_s)
  TRANS(xvfsqrt_d, LASX, gen_xx_ptr, gen_helper_vfsqrt_d)
  TRANS(xvfrecip_s, LASX, gen_xx_ptr, gen_helper_vfrecip_s)
  TRANS(xvfrecip_d, LASX, gen_xx_ptr, gen_helper_vfrecip_d)
  TRANS(xvfrsqrt_s, LASX, gen_xx_ptr, gen_helper_vfrsqrt_s)
  TRANS(xvfrsqrt_d, LASX, gen_xx_ptr, gen_helper_vfrsqrt_d)
+TRANS(xvfrecipe_s, FRECIPE_LASX, gen_xx_ptr, gen_helper_vfrecip_s)
+TRANS(xvfrecipe_d, FRECIPE_LASX, gen_xx_ptr, gen_helper_vfrecip_d)
+TRANS(xvfrsqrte_s, FRECIPE_LASX, gen_xx_ptr, gen_helper_vfrsqrt_s)
+TRANS(xvfrsqrte_d, FRECIPE_LASX, gen_xx_ptr, gen_helper_vfrsqrt_d)
  
  TRANS(vfcvtl_s_h, LSX, gen_vv_ptr, gen_helper_vfcvtl_s_h)
  TRANS(vfcvth_s_h, LSX, gen_vv_ptr, gen_helper_vfcvth_s_h)
diff --git a/target/loongarch/translate.h b/target/loongarch/translate.h

index 9ba3b425c1a993e23f34d7bce3a2cbfed9cae614..331f79c8f2ac58fe785471a47063d9b0dcea5657 100644 (file)
--- a/target/loongarch/translate.h
+++ b/target/loongarch/translate.h
@@ -33,6 +33,12 @@
  #define avail_IOCSR(C)  (FIELD_EX32((C)->cpucfg1, CPUCFG1, IOCSR))
  #define avail_CRC(C)    (FIELD_EX32((C)->cpucfg1, CPUCFG1, CRC))
  
+#define avail_FRECIPE(C) (FIELD_EX32((C)->cpucfg2, CPUCFG2, FRECIPE))
+#define avail_FRECIPE_FP_SP(C) (avail_FRECIPE(C) && avail_FP_SP(C))
+#define avail_FRECIPE_FP_DP(C) (avail_FRECIPE(C) && avail_FP_DP(C))
+#define avail_FRECIPE_LSX(C)   (avail_FRECIPE(C) && avail_LSX(C))
+#define avail_FRECIPE_LASX(C)   (avail_FRECIPE(C) && avail_LASX(C))
+
  /*
   * If an operation is being performed on less than TARGET_LONG_BITS,
   * it may require the inputs to be sign- or zero-extended; which will
author	Jiajie Chen <c@jia.je>
	Wed, 19 Nov 2025 12:30:55 +0000 (20:30 +0800)
committer	Song Gao <gaosong@loongson.cn>
	Tue, 10 Feb 2026 02:48:20 +0000 (10:48 +0800)
target/loongarch/cpu.h		patch \| blob \| blame \| history
target/loongarch/disas.c		patch \| blob \| blame \| history
target/loongarch/insns.decode		patch \| blob \| blame \| history
target/loongarch/tcg/insn_trans/trans_farith.c.inc		patch \| blob \| blame \| history
target/loongarch/tcg/insn_trans/trans_vec.c.inc		patch \| blob \| blame \| history
target/loongarch/translate.h		patch \| blob \| blame \| history