Merging r266825: (4ed8a4ea) · Commits · llvm-doe / llvm-project

llvm/lib/Target/AMDGPU/SIInstrInfo.cpp

+3 −3

Original line number	Diff line number	Diff line
		@@ -917,10 +917,10 @@ MachineInstr *SIInstrInfo::commuteInstructionImpl(MachineInstr *MI,
		MachineOperand &Src1 = MI->getOperand(Src1Idx);


		if (isVOP2(*MI)) {
		if (isVOP2(*MI) || isVOPC(*MI)) {
		const MCInstrDesc &InstrDesc = MI->getDesc();
		// For VOP2 instructions, any operand type is valid to use for src0. Make
		// sure we can use the src1 as src0.
		// For VOP2 and VOPC instructions, any operand type is valid to use for
		// src0. Make sure we can use the src0 as src1.
		//
		// We could be stricter here and only allow commuting if there is a reason
		// to do so. i.e. if both operands are VGPRs there is no real benefit,

0 → 100644

+50 −0

Original line number	Diff line number	Diff line
		; RUN: llc < %s -march=amdgcn -mcpu=verde -verify-machineinstrs | FileCheck %s
		; RUN: llc < %s -march=amdgcn -mcpu=tonga -verify-machineinstrs | FileCheck %s

		target triple = "amdgcn--"

		; CHECK-LABEL: {{^}}main:
		;
		; Test for compilation only. This generated an invalid machine instruction
		; by trying to commute the operands of a V_CMP_EQ_i32_e32 instruction, both
		; of which were in SGPRs.
		; Function under test; it carries attribute group #2. It takes an i32,
		; conditionally doubles it along two paths, and returns the result bitcast
		; to float. The two llvm.SI.load.const results are bitcast to i32 and
		; compared against 0 to drive the later branches; presumably these icmp eq
		; instructions are the compares the file header comment refers to.
		define float @main(i32 %v) #2 {
		main_body:
		%d1 = call float @llvm.SI.load.const(<16 x i8> undef, i32 960)
		%d2 = call float @llvm.SI.load.const(<16 x i8> undef, i32 976)
		; The condition of this first branch is undef.
		br i1 undef, label %ENDIF56, label %IF57

		IF57: ; preds = %main_body
		%v.1 = mul i32 %v, 2
		br label %ENDIF56

		ENDIF56: ; preds = %IF57, %main_body
		; %v.2 is %v when arriving from main_body, or %v * 2 when arriving from IF57.
		%v.2 = phi i32 [ %v, %main_body ], [ %v.1, %IF57 ]
		; First compare: the loaded constant %d1, reinterpreted as i32, against 0.
		%d1.i = bitcast float %d1 to i32
		%cc1 = icmp eq i32 %d1.i, 0
		br i1 %cc1, label %ENDIF59, label %IF60

		IF60: ; preds = %ENDIF56
		%v.3 = mul i32 %v.2, 2
		br label %ENDIF59

		ENDIF59: ; preds = %IF60, %ENDIF56
		; %v.4 is %v.2 when arriving from ENDIF56, or %v.2 * 2 when arriving from IF60.
		%v.4 = phi i32 [ %v.2, %ENDIF56 ], [ %v.3, %IF60 ]
		; Second compare: the loaded constant %d2, reinterpreted as i32, against 0.
		%d2.i = bitcast float %d2 to i32
		%cc2 = icmp eq i32 %d2.i, 0
		br i1 %cc2, label %ENDIF62, label %IF63

		IF63: ; preds = %ENDIF59
		; The not-equal path of the second compare ends in unreachable.
		unreachable

		ENDIF62: ; preds = %ENDIF59
		; Return the accumulated integer value reinterpreted as a float.
		%r = bitcast i32 %v.4 to float
		ret float %r
		}

		; Declaration of the intrinsic called twice in @main; it takes a <16 x i8>
		; and an i32 and returns a float.
		; Function Attrs: nounwind readnone
		declare float @llvm.SI.load.const(<16 x i8>, i32) #0

		; #0 is attached to the llvm.SI.load.const declaration above.
		attributes #0 = { nounwind readnone }
		; NOTE(review): #1 is not referenced anywhere in the visible part of this
		; file; confirm whether it is still needed.
		attributes #1 = { readnone }
		; #2 is attached to @main.
		attributes #2 = { "ShaderType"="1" }