From af4fb245e12f2dd8e2c32167c9acfaceb4b6af6a Mon Sep 17 00:00:00 2001
From: Hongyu Wang <hongyu.wang@intel.com>
Date: Fri, 17 Jan 2025 09:04:17 +0800
Subject: [PATCH] i386: Fix wrong insn generated by shld/shrd ndd split
 [PR118510]

For shld/shrd_ndd_2 insn, the spiltter outputs wrong pattern that
mixed parallel for clobber and set. Use register_operand as dest
and ajdust output template to fix.

gcc/ChangeLog:

	PR target/118510
	* config/i386/i386.md (*x86_64_shld_ndd_2): Use register_operand
	for operand[0] and adjust the output template to directly
	generate ndd form shld pattern.
	(*x86_shld_ndd_2): Likewise.
	(*x86_64_shrd_ndd_2): Likewise.
	(*x86_shrd_ndd_2): Likewise.

gcc/testsuite/ChangeLog:

	PR target/118510
	* gcc.target/i386/pr118510.c: New test.
---
 gcc/config/i386/i386.md                  | 44 +++++++-----------------
 gcc/testsuite/gcc.target/i386/pr118510.c | 14 ++++++++
 2 files changed, 26 insertions(+), 32 deletions(-)
 create mode 100644 gcc/testsuite/gcc.target/i386/pr118510.c

diff --git a/gcc/config/i386/i386.md b/gcc/config/i386/i386.md
index 5fbd0848df5b..c977e86b72e8 100644
--- a/gcc/config/i386/i386.md
+++ b/gcc/config/i386/i386.md
@@ -15596,7 +15596,7 @@
 	      (clobber (reg:CC FLAGS_REG))])])
 
 (define_insn_and_split "*x86_64_shld_ndd_2"
-  [(set (match_operand:DI 0 "nonimmediate_operand")
+  [(set (match_operand:DI 0 "register_operand")
 	(ior:DI (ashift:DI (match_operand:DI 1 "nonimmediate_operand")
 			   (match_operand:QI 3 "nonmemory_operand"))
 		(lshiftrt:DI (match_operand:DI 2 "register_operand")
@@ -15606,7 +15606,7 @@
    && ix86_pre_reload_split ()"
   "#"
   "&& 1"
-  [(parallel [(set (match_dup 4)
+  [(parallel [(set (match_dup 0)
 		   (ior:DI (ashift:DI (match_dup 1)
 				      (and:QI (match_dup 3) (const_int 63)))
 			   (subreg:DI
@@ -15615,12 +15615,7 @@
 				 (minus:QI (const_int 64)
 					   (and:QI (match_dup 3)
 						   (const_int 63)))) 0)))
-	      (clobber (reg:CC FLAGS_REG))
-	      (set (match_dup 0) (match_dup 4))])]
-{
-  operands[4] = gen_reg_rtx (DImode);
-  emit_move_insn (operands[4], operands[0]);
-})
+	      (clobber (reg:CC FLAGS_REG))])])
 
 (define_insn "x86_shld<nf_name>"
   [(set (match_operand:SI 0 "nonimmediate_operand" "+r*m")
@@ -15832,7 +15827,7 @@
 	      (clobber (reg:CC FLAGS_REG))])])
 
 (define_insn_and_split "*x86_shld_ndd_2"
-  [(set (match_operand:SI 0 "nonimmediate_operand")
+  [(set (match_operand:SI 0 "register_operand")
 	(ior:SI (ashift:SI (match_operand:SI 1 "nonimmediate_operand")
 			   (match_operand:QI 3 "nonmemory_operand"))
 		(lshiftrt:SI (match_operand:SI 2 "register_operand")
@@ -15842,7 +15837,7 @@
    && ix86_pre_reload_split ()"
   "#"
   "&& 1"
-  [(parallel [(set (match_dup 4)
+  [(parallel [(set (match_dup 0)
 		   (ior:SI (ashift:SI (match_dup 1)
 				      (and:QI (match_dup 3) (const_int 31)))
 			   (subreg:SI
@@ -15851,12 +15846,7 @@
 				 (minus:QI (const_int 32)
 					   (and:QI (match_dup 3)
 						   (const_int 31)))) 0)))
-	      (clobber (reg:CC FLAGS_REG))
-	      (set (match_dup 0) (match_dup 4))])]
-{
-  operands[4] = gen_reg_rtx (SImode);
-  emit_move_insn (operands[4], operands[0]);
-})
+	      (clobber (reg:CC FLAGS_REG))])])
 
 (define_expand "@x86_shift<mode>_adj_1"
   [(set (reg:CCZ FLAGS_REG)
@@ -16991,7 +16981,7 @@
 	      (clobber (reg:CC FLAGS_REG))])])
 
 (define_insn_and_split "*x86_64_shrd_ndd_2"
-  [(set (match_operand:DI 0 "nonimmediate_operand")
+  [(set (match_operand:DI 0 "register_operand")
 	(ior:DI (lshiftrt:DI (match_operand:DI 1 "nonimmediate_operand")
 			     (match_operand:QI 3 "nonmemory_operand"))
 		(ashift:DI (match_operand:DI 2 "register_operand")
@@ -17001,7 +16991,7 @@
   && ix86_pre_reload_split ()"
   "#"
   "&& 1"
-  [(parallel [(set (match_dup 4)
+  [(parallel [(set (match_dup 0)
 		   (ior:DI (lshiftrt:DI (match_dup 1)
 					(and:QI (match_dup 3) (const_int 63)))
 			   (subreg:DI
@@ -17010,12 +17000,7 @@
 				 (minus:QI (const_int 64)
 					   (and:QI (match_dup 3)
 						   (const_int 63)))) 0)))
-	      (clobber (reg:CC FLAGS_REG))
-	      (set (match_dup 0) (match_dup 4))])]
-{
-  operands[4] = gen_reg_rtx (DImode);
-  emit_move_insn (operands[4], operands[0]);
-})
+	      (clobber (reg:CC FLAGS_REG))])])
 
 (define_insn "x86_shrd<nf_name>"
   [(set (match_operand:SI 0 "nonimmediate_operand" "+r*m")
@@ -17226,7 +17211,7 @@
 	      (clobber (reg:CC FLAGS_REG))])])
 
 (define_insn_and_split "*x86_shrd_ndd_2"
-  [(set (match_operand:SI 0 "nonimmediate_operand")
+  [(set (match_operand:SI 0 "register_operand")
 	(ior:SI (lshiftrt:SI (match_operand:SI 1 "nonimmediate_operand")
 			   (match_operand:QI 3 "nonmemory_operand"))
 		(ashift:SI (match_operand:SI 2 "register_operand")
@@ -17236,7 +17221,7 @@
    && ix86_pre_reload_split ()"
   "#"
   "&& 1"
-  [(parallel [(set (match_dup 4)
+  [(parallel [(set (match_dup 0)
 		   (ior:SI (lshiftrt:SI (match_dup 1)
 				        (and:QI (match_dup 3) (const_int 31)))
 			   (subreg:SI
@@ -17245,12 +17230,7 @@
 				 (minus:QI (const_int 32)
 					   (and:QI (match_dup 3)
 						   (const_int 31)))) 0)))
-	      (clobber (reg:CC FLAGS_REG))
-	      (set (match_dup 0) (match_dup 4))])]
-{
-  operands[4] = gen_reg_rtx (SImode);
-  emit_move_insn (operands[4], operands[0]);
-})
+	      (clobber (reg:CC FLAGS_REG))])])
 
 ;; Base name for insn mnemonic.
 (define_mode_attr cvt_mnemonic
diff --git a/gcc/testsuite/gcc.target/i386/pr118510.c b/gcc/testsuite/gcc.target/i386/pr118510.c
new file mode 100644
index 000000000000..6cfe8182b6f2
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/pr118510.c
@@ -0,0 +1,14 @@
+/* { dg-do compile { target { ! ia32 } } } */
+/* { dg-options "-O2 -mapxf" } */
+
+typedef struct cpp_num cpp_num;
+struct cpp_num {
+    int high;
+    unsigned low;
+    int overflow;
+};
+int num_rshift_n;
+cpp_num num_lshift(cpp_num num) {
+    num.low = num.low >> num_rshift_n | num.high << (32 - num_rshift_n);
+    return num;
+}
-- 
GitLab