Skip to content

Commit fe23ed2

Browse files
committed
AMDGPU: Temporarily drop s_mul_hi_i/u32 patterns
These selection patterns introduce performance regressions in several applications. This change has already been submitted downstream. llvm-svn: 361879
1 parent 1468991 commit fe23ed2

File tree

2 files changed

+2
-11
lines changed

2 files changed

+2
-11
lines changed

llvm/lib/Target/AMDGPU/SOPInstructions.td

Lines changed: 2 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -558,12 +558,8 @@ let SubtargetPredicate = isGFX9Plus in {
558558
def S_LSHL4_ADD_U32 : SOP2_32<"s_lshl4_add_u32">;
559559
} // End Defs = [SCC]
560560

561-
let isCommutable = 1 in {
562-
def S_MUL_HI_U32 : SOP2_32<"s_mul_hi_u32",
563-
[(set i32:$sdst, (UniformBinFrag<mulhu> SSrc_b32:$src0, SSrc_b32:$src1))]>;
564-
def S_MUL_HI_I32 : SOP2_32<"s_mul_hi_i32",
565-
[(set i32:$sdst, (UniformBinFrag<mulhs> SSrc_b32:$src0, SSrc_b32:$src1))]>;
566-
}
561+
def S_MUL_HI_U32 : SOP2_32<"s_mul_hi_u32">;
562+
def S_MUL_HI_I32 : SOP2_32<"s_mul_hi_i32">;
567563
} // End SubtargetPredicate = isGFX9Plus
568564

569565
//===----------------------------------------------------------------------===//

llvm/test/CodeGen/AMDGPU/mul.ll

Lines changed: 0 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -141,11 +141,6 @@ define amdgpu_kernel void @v_mul_i32(i32 addrspace(1)* %out, i32 addrspace(1)* %
141141
; crash with a 'failed to select' error.
142142

143143
; FUNC-LABEL: {{^}}s_mul_i64:
144-
; GFX9_10-DAG: s_mul_i32
145-
; GFX9_10-DAG: s_mul_hi_u32
146-
; GFX9_10-DAG: s_mul_i32
147-
; GFX9_10-DAG: s_mul_i32
148-
; GFX9_10: s_endpgm
149144
define amdgpu_kernel void @s_mul_i64(i64 addrspace(1)* %out, i64 %a, i64 %b) nounwind {
150145
%mul = mul i64 %a, %b
151146
store i64 %mul, i64 addrspace(1)* %out, align 8

0 commit comments

Comments
 (0)